diff --git a/.gitattributes b/.gitattributes index d4b9ec5eb8c5b407b3bcb6cad652b692ad279b21..a11579eb388f26d035b1fc223e5db1b88795a145 100644 --- a/.gitattributes +++ b/.gitattributes @@ -169,3 +169,4 @@ data/train_NER/20190109_train_NER.tar.gz filter=lfs diff=lfs merge=lfs -text data/AB/1970/04_correctedxml.tar.gz filter=lfs diff=lfs merge=lfs -text data/AB/1971/04_correctedxml.tar.gz filter=lfs diff=lfs merge=lfs -text data/train_NER/20190116_train_NER_french.tar.gz filter=lfs diff=lfs merge=lfs -text +data/AB/1972/04_correctedxml.tar.gz filter=lfs diff=lfs merge=lfs -text diff --git a/.renku/workflow/a29a24b4b00f4b7eaf5540b98f81966a_python.cwl b/.renku/workflow/a29a24b4b00f4b7eaf5540b98f81966a_python.cwl new file mode 100644 index 0000000000000000000000000000000000000000..b150efbbbc130a6cd49b09485c7493eb99a6bd16 --- /dev/null +++ b/.renku/workflow/a29a24b4b00f4b7eaf5540b98f81966a_python.cwl @@ -0,0 +1,51 @@ +arguments: [] +baseCommand: +- python +class: CommandLineTool +cwlVersion: v1.0 +hints: [] +inputs: + input_1: + default: + class: File + path: ../../src/python/run_correctxml.py + inputBinding: + position: 1 + separate: true + shellQuote: true + streamable: false + type: File + input_2: + default: + class: File + path: ../../data/AB/1972/02_extractedxml.tar.gz + inputBinding: + position: 2 + separate: true + shellQuote: true + streamable: false + type: File + input_3: + default: data/AB/1972/04_correctedxml.tar.gz + inputBinding: + position: 3 + separate: true + shellQuote: true + streamable: false + type: string +outputs: + output_0: + outputBinding: + glob: $(inputs.input_3) + streamable: false + type: File +permanentFailCodes: [] +requirements: +- class: InlineJavascriptRequirement +- class: InitialWorkDirRequirement + listing: + - entry: '$({"listing": [], "class": "Directory"})' + entryname: data/AB/1972 + writable: true +successCodes: [] +temporaryFailCodes: [] diff --git a/data/AB/1972/04_correctedxml.tar.gz b/data/AB/1972/04_correctedxml.tar.gz new file mode 100644 index 0000000000000000000000000000000000000000..a936494ecf16a998574d4505b08ae421d9539c1e --- /dev/null +++ b/data/AB/1972/04_correctedxml.tar.gz @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fc2b7da468479d966114d65d094869b5cb0d362805397138b98783b4f61187c +size 32454837