-
Notifications
You must be signed in to change notification settings - Fork 0
/
ticcl_nf.cwl
85 lines (78 loc) · 1.58 KB
/
ticcl_nf.cwl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
#!/usr/bin/env cwl-runner
# CWL wrapper around the `ticcl.nf` command.
#
# Every input below is forwarded to `ticcl.nf` as `<prefix> <value>`.
# Inputs whose type ends in `?` are optional; when they are not supplied,
# nothing is added to the command line for them.
cwlVersion: v1.0
class: CommandLineTool
baseCommand: "ticcl.nf"

# The container image is a hint, not a requirement.
hints:
  - class: DockerRequirement
    dockerPull: egpbos/lamachine:piccl

doc: |
  Run TICCL nextflow pipeline.
  Corrects OCR errors in the documents in the input directory.

# Set a UTF-8 locale in the tool's environment.
requirements:
  EnvVarRequirement:
    envDef:
      LC_ALL: C.UTF-8
      LANG: C.UTF-8

inputs:
  # mandatory ticcl.nf parameters:
  input_dir:
    type: Directory
    inputBinding:
      prefix: --inputdir
  lexicon_file:
    type: File
    inputBinding:
      prefix: --lexicon
  alphabet_file:
    type: File
    inputBinding:
      prefix: --alphabet
  character_confusion_file:
    type: File
    inputBinding:
      prefix: --charconfus

  # optional ticcl.nf parameters:
  # NOTE(review): output_dir is typed as Directory, so the caller has to pass
  # an existing directory object rather than a plain path string -- confirm
  # this is intended.
  output_dir:
    type: Directory?
    inputBinding:
      prefix: --outputdir
  language:
    type: string?
    inputBinding:
      prefix: --language
  input_extension:
    type: string?
    inputBinding:
      prefix: --extension
  input_class:
    type: string?
    inputBinding:
      prefix: --inputclass
  input_type:
    type: string?
    inputBinding:
      prefix: --inputtype
  virtual_env:
    type: Directory?
    inputBinding:
      prefix: --virtualenv
  artificial_frequency_lexicon_words:
    type: int?
    inputBinding:
      prefix: --artifrq
  levenshtein_distance:
    type: int?
    inputBinding:
      prefix: --distance
  clip_below:
    type: int?
    inputBinding:
      prefix: --clip
  corpus_frequency_file:
    type: File?
    inputBinding:
      prefix: --corpusfreqlist

# The tool's standard output is captured in `cwl.output.json`. A CWL runner
# that finds a file with this name in the output directory reads the output
# object from it, which is why `out_files` carries no outputBinding.
# Presumably `ticcl.nf` prints a JSON object with an `out_files` key on
# stdout -- TODO confirm against the pipeline.
stdout: cwl.output.json

outputs:
  out_files:
    type: File[]