-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathproject.lock
161 lines (161 loc) · 5 KB
/
project.lock
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
convert:
cmd: python -m spacy run convert
script:
- python scripts/convert_ner.py en assets/ner_train.jsonl corpus/ner_train.spacy
- python scripts/convert_ner.py en assets/ner_valid.jsonl corpus/ner_valid.spacy
- python scripts/convert_senter.py en assets/senter_train.jsonl corpus/senter_train.spacy
- python scripts/convert_senter.py en assets/senter_valid.jsonl corpus/senter_valid.spacy
deps:
- path: assets/ner_train.jsonl
md5: e0fb3b0f4c99bc103c166028338f1b6a
- path: assets/ner_valid.jsonl
md5: c20910505436b1577657da1169bab36b
- path: assets/senter_train.jsonl
md5: f6a06405e874c4acd9374c2072b4be83
- path: assets/senter_valid.jsonl
md5: 6f3c0f29f54529747f597711cac22201
- path: scripts/convert_ner.py
md5: 9004e1545bc07e1ee00c85ca016e0afe
- path: scripts/convert_senter.py
md5: b84ab83edabae8f7de6ce8e5892ac180
outs:
- path: corpus/ner_train.spacy
md5: 0c384c2eb7d649b68ba4fedb55c885c4
- path: corpus/ner_valid.spacy
md5: 46e203020f092d82f3e9743c64a770e7
- path: corpus/senter_train.spacy
md5: 8f57d827f72b404f11620cbff36e730c
- path: corpus/senter_valid.spacy
md5: c9197d0564c527442f4eff4c8df0a88f
spacy_version: 3.2.3
spacy_git_version: 99425de36
create-config:
cmd: python -m spacy run create-config
script:
- python -m spacy init config --lang en --pipeline ner configs/config.cfg --force
deps: []
outs:
- path: configs/config.cfg
md5: 89958efd9faccb2e4374ae2544ebd215
spacy_version: 3.2.3
spacy_git_version: 99425de36
train:
cmd: python -m spacy run train
script:
- python -m spacy train configs/config.cfg --output training/ --gpu-id -1 --initialize.vectors
en_core_web_lg --components.tok2vec.model.embed.include_static_vectors true
deps:
- path: configs/config.cfg
md5: cc5e771dda6199a127ad272bf9e02c42
- path: corpus/train.spacy
md5: 4dac9cdea512c17a4c63671dec08bafa
- path: corpus/dev.spacy
md5: b8eba5abc5f9abb957d8242bd540c2c8
outs:
- path: training/model-best
md5: ec595899e24fc4d212adc09f3ed46801
spacy_version: 3.2.3
spacy_git_version: 99425de36
evaluate:
cmd: python -m spacy run evaluate
script:
- python -m spacy evaluate training/model-best corpus/dev.spacy --output training/metrics.json
deps:
- path: corpus/dev.spacy
md5: b8eba5abc5f9abb957d8242bd540c2c8
- path: training/model-best
md5: ec595899e24fc4d212adc09f3ed46801
outs:
- path: training/metrics.json
md5: 29cab9e69b7e18eb48e17aeb690e5a69
spacy_version: 3.2.3
spacy_git_version: 99425de36
partition:
cmd: python -m spacy run partition
script:
- python scripts/partition.py assets/ecfr_ner.jsonl assets/ner_train.jsonl assets/ner_valid.jsonl
- python scripts/partition.py assets/ecfr_sents.jsonl assets/senter_train.jsonl
assets/senter_valid.jsonl
deps: []
outs: []
spacy_version: 3.2.3
spacy_git_version: 99425de36
download:
cmd: python -m spacy run download
script:
- python -m spacy download en_core_web_lg
deps: []
outs: []
spacy_version: 3.2.3
spacy_git_version: 99425de36
train-senter:
cmd: python -m spacy run train-senter
script:
- prodigy train senter --senter ecfr_labeled_sents
deps: []
outs: []
spacy_version: 3.2.3
spacy_git_version: 99425de36
clean:
cmd: python -m spacy run clean
script:
- rm -rf training
- rm -rf corpus
- rm -rf packages
deps: []
outs: []
spacy_version: 3.2.3
spacy_git_version: 99425de36
data-to-spacy:
cmd: python -m spacy run data-to-spacy
script:
- python -m prodigy data-to-spacy corpus/ --senter ecfr_labeled_sents --ner ecfr_labeled_ner
deps: []
outs:
- path: corpus/train.spacy
md5: 4dac9cdea512c17a4c63671dec08bafa
- path: corpus/dev.spacy
md5: b8eba5abc5f9abb957d8242bd540c2c8
spacy_version: 3.2.3
spacy_git_version: 99425de36
data-to-asset-senter:
cmd: python -m spacy run data-to-asset-senter
script:
- python -m prodigy db-out ecfr_labeled_sents assets/ecfr_senter_labels.jsonl
deps: []
outs:
- path: assets
md5: 6e226cca080f5c11630c76cf9912741a
spacy_version: 3.2.3
spacy_git_version: 99425de36
data-to-asset-ner:
cmd: python -m spacy run data-to-asset-ner
script:
- python -m prodigy db-out ecfr_initial_ner assets/ecfr_ner_labels.jsonl
deps: []
outs:
- path: assets
md5: 24e816efd133f3c42d9f466b00badee5
spacy_version: 3.2.3
spacy_git_version: 99425de36
document:
cmd: python -m spacy run document
script:
- spacy project document --output README.md
deps: []
outs: []
spacy_version: 3.2.3
spacy_git_version: 99425de36
package:
cmd: python -m spacy run package
script:
- python -m spacy package training/model-best packages --name ecfr_ner --version
0.1.0 --force
deps:
- path: training/model-best
md5: ec595899e24fc4d212adc09f3ed46801
outs:
- path: packages/en_ecfr_ner-0.1.0/dist/en_ecfr_ner-0.1.0.tar.gz
md5: cc0778ab709aa15aff1a76ea3d8e45e3
spacy_version: 3.2.3
spacy_git_version: 99425de36