Skip to content
Snippets Groups Projects
Commit 6a3a6624 authored by Lili Gasser
Browse files

Merge branch 'master' into 'update-mp-extraction'

# Conflicts:
#   .gitattributes
parents 596eaea9 86b84bab
No related branches found
No related tags found
No related merge requests found
Showing
with 645 additions and 0 deletions
...@@ -169,6 +169,7 @@ data/train_NER/20190109_train_NER.tar.gz filter=lfs diff=lfs merge=lfs -text ...@@ -169,6 +169,7 @@ data/train_NER/20190109_train_NER.tar.gz filter=lfs diff=lfs merge=lfs -text
data/AB/1970/04_correctedxml.tar.gz filter=lfs diff=lfs merge=lfs -text data/AB/1970/04_correctedxml.tar.gz filter=lfs diff=lfs merge=lfs -text
data/AB/1971/04_correctedxml.tar.gz filter=lfs diff=lfs merge=lfs -text data/AB/1971/04_correctedxml.tar.gz filter=lfs diff=lfs merge=lfs -text
data/train_NER/20190116_train_NER_french.tar.gz filter=lfs diff=lfs merge=lfs -text data/train_NER/20190116_train_NER_french.tar.gz filter=lfs diff=lfs merge=lfs -text
data/AB/1972/04_correctedxml.tar.gz filter=lfs diff=lfs merge=lfs -text
data/AB/1926/03_correctedmeta.tar.gz filter=lfs diff=lfs merge=lfs -text data/AB/1926/03_correctedmeta.tar.gz filter=lfs diff=lfs merge=lfs -text
data/AB/1927/03_correctedmeta.tar.gz filter=lfs diff=lfs merge=lfs -text data/AB/1927/03_correctedmeta.tar.gz filter=lfs diff=lfs merge=lfs -text
data/AB/1928/03_correctedmeta.tar.gz filter=lfs diff=lfs merge=lfs -text data/AB/1928/03_correctedmeta.tar.gz filter=lfs diff=lfs merge=lfs -text
...@@ -241,3 +242,14 @@ data/AB/1994/03_correctedmeta.tar.gz filter=lfs diff=lfs merge=lfs -text ...@@ -241,3 +242,14 @@ data/AB/1994/03_correctedmeta.tar.gz filter=lfs diff=lfs merge=lfs -text
data/AB/1995/03_correctedmeta.tar.gz filter=lfs diff=lfs merge=lfs -text data/AB/1995/03_correctedmeta.tar.gz filter=lfs diff=lfs merge=lfs -text
data/politicians/MPs_after1890.csv filter=lfs diff=lfs merge=lfs -text data/politicians/MPs_after1890.csv filter=lfs diff=lfs merge=lfs -text
data/politicians/lastnames/** filter=lfs diff=lfs merge=lfs -text data/politicians/lastnames/** filter=lfs diff=lfs merge=lfs -text
data/AB/1973/04_correctedxml.tar.gz filter=lfs diff=lfs merge=lfs -text
data/AB/1975/02_extractedxml.tar.gz filter=lfs diff=lfs merge=lfs -text
data/AB/1976/02_extractedxml.tar.gz filter=lfs diff=lfs merge=lfs -text
data/AB/1974/04_correctedxml.tar.gz filter=lfs diff=lfs merge=lfs -text
data/AB/1980/02_extractedxml.tar.gz filter=lfs diff=lfs merge=lfs -text
data/AB/1981/02_extractedxml.tar.gz filter=lfs diff=lfs merge=lfs -text
data/AB/1977/02_extractedxml.tar.gz filter=lfs diff=lfs merge=lfs -text
data/AB/1982/02_extractedxml.tar.gz filter=lfs diff=lfs merge=lfs -text
data/AB/1983/02_extractedxml.tar.gz filter=lfs diff=lfs merge=lfs -text
data/AB/1991/02_extractedxml.tar.gz filter=lfs diff=lfs merge=lfs -text
data/AB/1991/04_correctedxml.tar.gz filter=lfs diff=lfs merge=lfs -text
---
# CWL CommandLineTool: runs `python <input_1> <input_2> <input_3>`.
# The three inputs are bound positionally (positions 1-3) after baseCommand.
arguments: []
baseCommand:
- python
class: CommandLineTool
cwlVersion: v1.0
hints: []
inputs:
  # Position 1: the script file handed to python.
  input_1:
    default:
      class: File
      path: ../../src/python/run_correctxml.py
    inputBinding:
      position: 1
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 2: the input file passed to the script.
  input_2:
    default:
      class: File
      path: ../../data/AB/1973/02_extractedxml.tar.gz
    inputBinding:
      position: 2
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 3: a path string; presumably where the script writes its
  # result -- TODO confirm against the script.
  input_3:
    default: data/AB/1973/04_correctedxml.tar.gz
    inputBinding:
      position: 3
      separate: true
      shellQuote: true
    streamable: false
    type: string
outputs:
  # Collected by globbing for the value of input_3.
  output_0:
    outputBinding:
      glob: $(inputs.input_3)
    streamable: false
    type: File
permanentFailCodes: []
requirements:
- class: InlineJavascriptRequirement
- class: InitialWorkDirRequirement
  listing:
  # Stages an empty, writable directory under this entryname.
  - entry: '$({"listing": [], "class": "Directory"})'
    entryname: data/AB/1973
    writable: true
successCodes: []
temporaryFailCodes: []
---
# CWL CommandLineTool: runs `python <input_1> <input_2> <input_3>`.
# The three inputs are bound positionally (positions 1-3) after baseCommand.
arguments: []
baseCommand:
- python
class: CommandLineTool
cwlVersion: v1.0
hints: []
inputs:
  # Position 1: the script file handed to python.
  input_1:
    default:
      class: File
      path: ../../src/python/run_extract_origxml.py
    inputBinding:
      position: 1
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 2: the input file passed to the script.
  input_2:
    default:
      class: File
      path: ../../data/AB/1981/00_rawpdfs.tar.gz
    inputBinding:
      position: 2
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 3: a path string; presumably where the script writes its
  # result -- TODO confirm against the script.
  input_3:
    default: data/AB/1981/02_extractedxml.tar.gz
    inputBinding:
      position: 3
      separate: true
      shellQuote: true
    streamable: false
    type: string
outputs:
  # Collected by globbing for the value of input_3.
  output_0:
    outputBinding:
      glob: $(inputs.input_3)
    streamable: false
    type: File
permanentFailCodes: []
requirements:
- class: InlineJavascriptRequirement
- class: InitialWorkDirRequirement
  listing:
  # Stages an empty, writable directory under this entryname.
  - entry: '$({"listing": [], "class": "Directory"})'
    entryname: data/AB/1981
    writable: true
successCodes: []
temporaryFailCodes: []
---
# CWL CommandLineTool: runs `python <input_1> <input_2> <input_3>`.
# The three inputs are bound positionally (positions 1-3) after baseCommand.
arguments: []
baseCommand:
- python
class: CommandLineTool
cwlVersion: v1.0
hints: []
inputs:
  # Position 1: the script file handed to python.
  input_1:
    default:
      class: File
      path: ../../src/python/run_extract_origxml.py
    inputBinding:
      position: 1
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 2: the input file passed to the script.
  input_2:
    default:
      class: File
      path: ../../data/AB/1991/00_rawpdfs.tar.gz
    inputBinding:
      position: 2
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 3: a path string; presumably where the script writes its
  # result -- TODO confirm against the script.
  input_3:
    default: data/AB/1991/02_extractedxml.tar.gz
    inputBinding:
      position: 3
      separate: true
      shellQuote: true
    streamable: false
    type: string
outputs:
  # Collected by globbing for the value of input_3.
  output_0:
    outputBinding:
      glob: $(inputs.input_3)
    streamable: false
    type: File
permanentFailCodes: []
requirements:
- class: InlineJavascriptRequirement
- class: InitialWorkDirRequirement
  listing:
  # Stages an empty, writable directory under this entryname.
  - entry: '$({"listing": [], "class": "Directory"})'
    entryname: data/AB/1991
    writable: true
successCodes: []
temporaryFailCodes: []
---
# CWL CommandLineTool: runs `python <input_1> <input_2> <input_3>`.
# The three inputs are bound positionally (positions 1-3) after baseCommand.
arguments: []
baseCommand:
- python
class: CommandLineTool
cwlVersion: v1.0
hints: []
inputs:
  # Position 1: the script file handed to python.
  input_1:
    default:
      class: File
      path: ../../src/python/run_extract_origxml.py
    inputBinding:
      position: 1
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 2: the input file passed to the script.
  input_2:
    default:
      class: File
      path: ../../data/AB/1980/00_rawpdfs.tar.gz
    inputBinding:
      position: 2
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 3: a path string; presumably where the script writes its
  # result -- TODO confirm against the script.
  input_3:
    default: data/AB/1980/02_extractedxml.tar.gz
    inputBinding:
      position: 3
      separate: true
      shellQuote: true
    streamable: false
    type: string
outputs:
  # Collected by globbing for the value of input_3.
  output_0:
    outputBinding:
      glob: $(inputs.input_3)
    streamable: false
    type: File
permanentFailCodes: []
requirements:
- class: InlineJavascriptRequirement
- class: InitialWorkDirRequirement
  listing:
  # Stages an empty, writable directory under this entryname.
  - entry: '$({"listing": [], "class": "Directory"})'
    entryname: data/AB/1980
    writable: true
successCodes: []
temporaryFailCodes: []
---
# CWL CommandLineTool: runs `python <input_1> <input_2> <input_3>`.
# The three inputs are bound positionally (positions 1-3) after baseCommand.
arguments: []
baseCommand:
- python
class: CommandLineTool
cwlVersion: v1.0
hints: []
inputs:
  # Position 1: the script file handed to python.
  input_1:
    default:
      class: File
      path: ../../src/python/run_extract_origxml.py
    inputBinding:
      position: 1
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 2: the input file passed to the script.
  input_2:
    default:
      class: File
      path: ../../data/AB/1982/00_rawpdfs.tar.gz
    inputBinding:
      position: 2
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 3: a path string; presumably where the script writes its
  # result -- TODO confirm against the script.
  input_3:
    default: data/AB/1982/02_extractedxml.tar.gz
    inputBinding:
      position: 3
      separate: true
      shellQuote: true
    streamable: false
    type: string
outputs:
  # Collected by globbing for the value of input_3.
  output_0:
    outputBinding:
      glob: $(inputs.input_3)
    streamable: false
    type: File
permanentFailCodes: []
requirements:
- class: InlineJavascriptRequirement
- class: InitialWorkDirRequirement
  listing:
  # Stages an empty, writable directory under this entryname.
  - entry: '$({"listing": [], "class": "Directory"})'
    entryname: data/AB/1982
    writable: true
successCodes: []
temporaryFailCodes: []
---
# CWL CommandLineTool: runs `python <input_1> <input_2> <input_3>`.
# The three inputs are bound positionally (positions 1-3) after baseCommand.
arguments: []
baseCommand:
- python
class: CommandLineTool
cwlVersion: v1.0
hints: []
inputs:
  # Position 1: the script file handed to python.
  input_1:
    default:
      class: File
      path: ../../src/python/run_correctxml.py
    inputBinding:
      position: 1
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 2: the input file passed to the script.
  input_2:
    default:
      class: File
      path: ../../data/AB/1972/02_extractedxml.tar.gz
    inputBinding:
      position: 2
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 3: a path string; presumably where the script writes its
  # result -- TODO confirm against the script.
  input_3:
    default: data/AB/1972/04_correctedxml.tar.gz
    inputBinding:
      position: 3
      separate: true
      shellQuote: true
    streamable: false
    type: string
outputs:
  # Collected by globbing for the value of input_3.
  output_0:
    outputBinding:
      glob: $(inputs.input_3)
    streamable: false
    type: File
permanentFailCodes: []
requirements:
- class: InlineJavascriptRequirement
- class: InitialWorkDirRequirement
  listing:
  # Stages an empty, writable directory under this entryname.
  - entry: '$({"listing": [], "class": "Directory"})'
    entryname: data/AB/1972
    writable: true
successCodes: []
temporaryFailCodes: []
---
# CWL CommandLineTool: runs `python <input_1> <input_2> <input_3>`.
# The three inputs are bound positionally (positions 1-3) after baseCommand.
arguments: []
baseCommand:
- python
class: CommandLineTool
cwlVersion: v1.0
hints: []
inputs:
  # Position 1: the script file handed to python.
  input_1:
    default:
      class: File
      path: ../../src/python/run_correctxml.py
    inputBinding:
      position: 1
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 2: the input file passed to the script.
  input_2:
    default:
      class: File
      path: ../../data/AB/1991/02_extractedxml.tar.gz
    inputBinding:
      position: 2
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 3: a path string; presumably where the script writes its
  # result -- TODO confirm against the script.
  input_3:
    default: data/AB/1991/04_correctedxml.tar.gz
    inputBinding:
      position: 3
      separate: true
      shellQuote: true
    streamable: false
    type: string
outputs:
  # Collected by globbing for the value of input_3.
  output_0:
    outputBinding:
      glob: $(inputs.input_3)
    streamable: false
    type: File
permanentFailCodes: []
requirements:
- class: InlineJavascriptRequirement
- class: InitialWorkDirRequirement
  listing:
  # Stages an empty, writable directory under this entryname.
  - entry: '$({"listing": [], "class": "Directory"})'
    entryname: data/AB/1991
    writable: true
successCodes: []
temporaryFailCodes: []
---
# CWL CommandLineTool: runs `python <input_1> <input_2> <input_3>`.
# The three inputs are bound positionally (positions 1-3) after baseCommand.
arguments: []
baseCommand:
- python
class: CommandLineTool
cwlVersion: v1.0
hints: []
inputs:
  # Position 1: the script file handed to python.
  input_1:
    default:
      class: File
      path: ../../src/python/run_extract_origxml.py
    inputBinding:
      position: 1
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 2: the input file passed to the script.
  input_2:
    default:
      class: File
      path: ../../data/AB/1983/00_rawpdfs.tar.gz
    inputBinding:
      position: 2
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 3: a path string; presumably where the script writes its
  # result -- TODO confirm against the script.
  input_3:
    default: data/AB/1983/02_extractedxml.tar.gz
    inputBinding:
      position: 3
      separate: true
      shellQuote: true
    streamable: false
    type: string
outputs:
  # Collected by globbing for the value of input_3.
  output_0:
    outputBinding:
      glob: $(inputs.input_3)
    streamable: false
    type: File
permanentFailCodes: []
requirements:
- class: InlineJavascriptRequirement
- class: InitialWorkDirRequirement
  listing:
  # Stages an empty, writable directory under this entryname.
  - entry: '$({"listing": [], "class": "Directory"})'
    entryname: data/AB/1983
    writable: true
successCodes: []
temporaryFailCodes: []
---
# CWL CommandLineTool: runs `python <input_1> <input_2> <input_3>`.
# The three inputs are bound positionally (positions 1-3) after baseCommand.
arguments: []
baseCommand:
- python
class: CommandLineTool
cwlVersion: v1.0
hints: []
inputs:
  # Position 1: the script file handed to python.
  input_1:
    default:
      class: File
      path: ../../src/python/run_extract_origxml.py
    inputBinding:
      position: 1
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 2: the input file passed to the script.
  input_2:
    default:
      class: File
      path: ../../data/AB/1975/00_rawpdfs.tar.gz
    inputBinding:
      position: 2
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 3: a path string; presumably where the script writes its
  # result -- TODO confirm against the script.
  input_3:
    default: data/AB/1975/02_extractedxml.tar.gz
    inputBinding:
      position: 3
      separate: true
      shellQuote: true
    streamable: false
    type: string
outputs:
  # Collected by globbing for the value of input_3.
  output_0:
    outputBinding:
      glob: $(inputs.input_3)
    streamable: false
    type: File
permanentFailCodes: []
requirements:
- class: InlineJavascriptRequirement
- class: InitialWorkDirRequirement
  listing:
  # Stages an empty, writable directory under this entryname.
  - entry: '$({"listing": [], "class": "Directory"})'
    entryname: data/AB/1975
    writable: true
successCodes: []
temporaryFailCodes: []
---
# CWL CommandLineTool: runs `python <input_1> <input_2> <input_3>`.
# The three inputs are bound positionally (positions 1-3) after baseCommand.
arguments: []
baseCommand:
- python
class: CommandLineTool
cwlVersion: v1.0
hints: []
inputs:
  # Position 1: the script file handed to python.
  input_1:
    default:
      class: File
      path: ../../src/python/run_correctxml.py
    inputBinding:
      position: 1
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 2: the input file passed to the script.
  input_2:
    default:
      class: File
      path: ../../data/AB/1974/02_extractedxml.tar.gz
    inputBinding:
      position: 2
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 3: a path string; presumably where the script writes its
  # result -- TODO confirm against the script.
  input_3:
    default: data/AB/1974/04_correctedxml.tar.gz
    inputBinding:
      position: 3
      separate: true
      shellQuote: true
    streamable: false
    type: string
outputs:
  # Collected by globbing for the value of input_3.
  output_0:
    outputBinding:
      glob: $(inputs.input_3)
    streamable: false
    type: File
permanentFailCodes: []
requirements:
- class: InlineJavascriptRequirement
- class: InitialWorkDirRequirement
  listing:
  # Stages an empty, writable directory under this entryname.
  - entry: '$({"listing": [], "class": "Directory"})'
    entryname: data/AB/1974
    writable: true
successCodes: []
temporaryFailCodes: []
---
# CWL CommandLineTool: runs `python <input_1> <input_2> <input_3>`.
# The three inputs are bound positionally (positions 1-3) after baseCommand.
arguments: []
baseCommand:
- python
class: CommandLineTool
cwlVersion: v1.0
hints: []
inputs:
  # Position 1: the script file handed to python.
  input_1:
    default:
      class: File
      path: ../../src/python/run_extract_origxml.py
    inputBinding:
      position: 1
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 2: the input file passed to the script.
  input_2:
    default:
      class: File
      path: ../../data/AB/1977/00_rawpdfs.tar.gz
    inputBinding:
      position: 2
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 3: a path string; presumably where the script writes its
  # result -- TODO confirm against the script.
  input_3:
    default: data/AB/1977/02_extractedxml.tar.gz
    inputBinding:
      position: 3
      separate: true
      shellQuote: true
    streamable: false
    type: string
outputs:
  # Collected by globbing for the value of input_3.
  output_0:
    outputBinding:
      glob: $(inputs.input_3)
    streamable: false
    type: File
permanentFailCodes: []
requirements:
- class: InlineJavascriptRequirement
- class: InitialWorkDirRequirement
  listing:
  # Stages an empty, writable directory under this entryname.
  - entry: '$({"listing": [], "class": "Directory"})'
    entryname: data/AB/1977
    writable: true
successCodes: []
temporaryFailCodes: []
---
# CWL CommandLineTool: runs `python <input_1> <input_2> <input_3>`.
# The three inputs are bound positionally (positions 1-3) after baseCommand.
arguments: []
baseCommand:
- python
class: CommandLineTool
cwlVersion: v1.0
hints: []
inputs:
  # Position 1: the script file handed to python.
  input_1:
    default:
      class: File
      path: ../../src/python/run_extract_origxml.py
    inputBinding:
      position: 1
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 2: the input file passed to the script.
  input_2:
    default:
      class: File
      path: ../../data/AB/1976/00_rawpdfs.tar.gz
    inputBinding:
      position: 2
      separate: true
      shellQuote: true
    streamable: false
    type: File
  # Position 3: a path string; presumably where the script writes its
  # result -- TODO confirm against the script.
  input_3:
    default: data/AB/1976/02_extractedxml.tar.gz
    inputBinding:
      position: 3
      separate: true
      shellQuote: true
    streamable: false
    type: string
outputs:
  # Collected by globbing for the value of input_3.
  output_0:
    outputBinding:
      glob: $(inputs.input_3)
    streamable: false
    type: File
permanentFailCodes: []
requirements:
- class: InlineJavascriptRequirement
- class: InitialWorkDirRequirement
  listing:
  # Stages an empty, writable directory under this entryname.
  - entry: '$({"listing": [], "class": "Directory"})'
    entryname: data/AB/1976
    writable: true
successCodes: []
temporaryFailCodes: []
File added
File added
File added
File added
File added
File added
File added
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment