# htr-united.yml
---
# Contributors to the dataset: one mapping per person, each carrying the list
# of roles recorded for them (transcriber, aligner, support, project-manager).
# NOTE(review): `name` appears to hold family names and `surname` given names
# (e.g. name "Chagué" / surname "Alix") — confirm against the HTR-United
# schema; the values are kept exactly as recorded.
authors:
  - name: Chagué
    roles:
      - transcriber
      - aligner
      - support
    surname: Alix
  - name: Riondet
    roles:
      - support
    surname: Charles
  - name: Le Fourner
    roles:
      - transcriber
    surname: Victoria
  - name: Bey
    roles:
      - transcriber
    surname: Laura
  - name: Vanneau
    roles:
      - transcriber
    surname: Laurie
  - name: Skilbeck-Gaborit
    roles:
      - transcriber
    surname: Eden
  - name: Meissel
    roles:
      - transcriber
    surname: Nina
  - name: Genero
    roles:
      - aligner
    surname: Jean-Damien
  - name: Champougny
    roles:
      - transcriber
    surname: Kevin
  - name: Albert
    roles:
      - project-manager
    surname: Anaïs
  - name: Martini
    roles:
      - project-manager
    surname: Manuela
# Character inventory of the transcriptions. Every member is a single
# character stored as a string; order is preserved from the original file.
characters:
  members:
    - e
    # Quoted: YAML 1.1 parsers may resolve a bare y/n/Y/N as a boolean.
    - 'n'
    - a
    - i
    - t
    - r
    - u
    - s
    - l
    - o
    - d
    - p
    - c
    - m
    # Combining marks are written as escapes so they cannot visually fuse
    # with a neighbouring character in editors or diffs.
    - "\u0301"  # combining acute accent
    - v
    - f
    - q
    - x
    - "\u0300"  # combining grave accent
    - ','
    - g
    - h
    - "'"
    - ;
    - j
    - C
    - b
    - P
    - D
    - ’
    - 'y'
    - B
    - .
    - L
    - M
    - "\u0302"  # combining circumflex accent
    - z
    - J
    - A
    - G
    - E
    - '-'
    # NOTE(review): the next entry is empty and parses as null, not as a
    # character. Presumably a whitespace character was lost here — restore it
    # as a quoted string once the intended character is confirmed.
    -
    - S
    - V
    - '?'
    - T
    - Q
    - F
    - '='
    - R
    - '4'
    - '2'
    - "\u0327"  # combining cedilla
    - k
    - —  # em dash (U+2014)
    - '7'
    - W
    - O
    - 'N'
    - '1'
    - '3'
    - '8'
    - '0'
    - '9'
    - ':'
    - –  # en dash (U+2013)
    - '5'
    - "\u0308"  # combining diaeresis
    - 'Y'
    - K
    - H
    - œ
    - I
    - )
    - (
    - U
    - Z
    - _
    - '@'
    - '!'
    - ‘
    - »
    - '&'
    - '6'
    - ─  # box-drawing light horizontal (U+2500), distinct from the dashes above
    - /
  # Unicode normalization form; consistent with accents being listed above as
  # standalone combining marks rather than precomposed letters.
  mode: NFD
# Free-text summary of the corpus. Folded scalar: the two lines below are
# joined with a single space and no trailing newline is kept.
description: >-
  Ground-Truth for French 19th century pre-printed documents created by
  administrative services.
format: Page-XML
# `count` is a bucket label and `precision` qualifies how it was obtained;
# both are plain strings.
hands:
  count: less-than-11
  precision: estimated
language:
  - fra
# List of licenses, each with a display name and a canonical URL.
license:
  - name: CC-BY 4.0
    url: https://creativecommons.org/licenses/by/4.0/
production-software: eScriptorium + Kraken
project-name: ANR TIME US
project-website: https://timeus.hypotheses.org/
# JSON schema this catalog entry declares itself against.
schema: https://htr-united.github.io/schema/2022-04-15/schema.json
script:
  - iso: Latn
script-type: evenly-mixed
# Years are kept as quoted strings so they are not parsed as integers.
# NOTE(review): both bounds are 1858 while the description speaks of the
# 19th century in general — confirm the intended date range.
time:
  notAfter: '1858'
  notBefore: '1858'
title: TIMEUS Corpus
url: https://github.com/HTR-United/timeuscorpus
# Dataset size: one entry per counted unit, pairing an integer `count` with
# the `metric` it measures.
volume:
  - count: 401304
    metric: characters
  - count: 250
    metric: files
  - count: 7701
    metric: lines
  - count: 159
    metric: pages
  - count: 586
    metric: regions