diff --git a/badges/characters.svg b/badges/characters.svg
index 06efa7b..5cc7ac1 100644
--- a/badges/characters.svg
+++ b/badges/characters.svg
@@ -17,7 +17,7 @@
Characters
- 399155
- 399155
+ 131511
+ 131511
-
\ No newline at end of file
+
diff --git a/badges/files.svg b/badges/files.svg
index 2bc2681..9d6a746 100644
--- a/badges/files.svg
+++ b/badges/files.svg
@@ -17,7 +17,7 @@
XML Files
- 150
- 150
+ 151
+ 151
-
\ No newline at end of file
+
diff --git a/badges/lines.svg b/badges/lines.svg
index 4e572ec..cca1c1d 100644
--- a/badges/lines.svg
+++ b/badges/lines.svg
@@ -17,7 +17,7 @@
Lines
- 4115
- 4115
+ 4376
+ 4376
-
\ No newline at end of file
+
diff --git a/badges/regions.svg b/badges/regions.svg
index f8db9d0..d5967cb 100644
--- a/badges/regions.svg
+++ b/badges/regions.svg
@@ -17,7 +17,7 @@
Regions
- 150
- 150
+ 375
+ 375
-
\ No newline at end of file
+
diff --git a/htr-united.yml b/htr-united.yml
index e1431cc..06c5161 100644
--- a/htr-united.yml
+++ b/htr-united.yml
@@ -1,92 +1,138 @@
-schema: https://htr-united.github.io/schema/2022-04-15/schema.json
-title: Tapus Corpus
-url: https://github.com/HTR-United/tapuscorpus
-project-name: 'HTR-United
-
- '
-project-website: https://htr-united.github.io/
authors:
-- name: "Chagu\xE9"
- surname: Alix
+- name: Chagué
roles:
- transcriber
- project-manager
-description: Ground truth based on a variety of French typewritten documents from
- the 20th century. Contains exerpts plays, poems, letters and administrative reports.
-language:
-- fra
-script:
-- iso: Latn
-script-type: only-typed
-time:
- notBefore: '1900'
- notAfter: '1999'
-hands:
- count: 1-per-folder
- precision: exact
-license:
-- name: CC-BY 4.0
- url: https://creativecommons.org/licenses/by/4.0/
-format: Page-XML
-volume:
-- metric: characters
- count: 399155
-- metric: files
- count: 150
-- metric: lines
- count: 4115
-- metric: pages
- count: 150
-- metric: regions
- count: 150
-sources:
-- reference: "Chagu\xE9, A. (2021). Tapuscorpus (Version 1.0) [Computer software].\
- \ https://doi.org/10.5072/zenodo.977649"
- link: ''
-citation-file-link: https://github.com/HTR-United/tapuscorpus/raw/main/citation.cff
-transcription-guidelines: See README in repository.
-production-software: eScriptorium + Kraken
+ surname: Alix
characters:
- mode: NFD
members:
- e
- - t
- - /
- - '0'
- a
- - c
+ - s
- n
+ - t
- r
- - '7'
- - m
- - h
- - p
- - s
+ - i
+ - u
- o
- - g
- - '4'
+ - l
- d
- - '1'
- - E
+ - c
+ - m
+ - p
+ - ́
- .
- - i
+ - '~'
+ - v
+ - ','
+ - "'"
- '-'
- - '2'
- - '9'
- - '5'
- f
- - <
- - l
- - '{'
- - ':'
- - P
+ - g
+ - h
+ - q
+ - b
+ - ̀
+ - _
+ - E
+ - L
- A
- - G
- - '}'
- - U
+ - I
+ - C
- x
- - '>'
- - b
- - '8'
+ - S
+ - M
+ - j
+ - T
+ - ̂
+ - R
+ - N
+ - '1'
+ - O
+ - P
+ - y
+ - '"'
+ - U
+ - J
+ - D
+ - '2'
+ - ':'
+ - )
+ - (
+ - B
+ - '0'
+ - '5'
- '3'
+ - '4'
+ - z
- '6'
+ - F
+ - H
+ - Q
+ - '!'
+ - '9'
+ - G
+ - '7'
+ - V
+ - '8'
+ - '?'
+ - ⟦
+ - ⟧
+ - ̧
+ - Y
+ - ;
+ - ’
+ - °
+ - k
+ - X
+ - ̈
+ - +
+ - '='
+ - W
+ - /
+ - K
+ - ^
+ - w
+ - Z
+ - '%'
+ - '*'
+ mode: NFD
+citation-file-link: https://github.com/HTR-United/tapuscorpus/raw/main/citation.cff
+description: Ground truth based on a variety of French typewritten documents from
+ the 20th century. Contains excerpts of plays, poems, letters and administrative reports.
+format: Page-XML
+hands:
+ count: 1-per-folder
+ precision: exact
+language:
+- fra
+license:
+- name: CC-BY 4.0
+ url: https://creativecommons.org/licenses/by/4.0/
+production-software: eScriptorium + Kraken
+project-name: "HTR-United\n"
+project-website: https://htr-united.github.io/
+schema: https://htr-united.github.io/schema/2022-04-15/schema.json
+script:
+- iso: Latn
+script-type: only-typed
+sources:
+- link: ''
+ reference: Chagué, A. (2021). Tapuscorpus (Version 1.0) [Computer software]. https://doi.org/10.5072/zenodo.977649
+time:
+ notAfter: '1999'
+ notBefore: '1900'
+title: Tapus Corpus
+transcription-guidelines: See README in repository.
+url: https://github.com/HTR-United/tapuscorpus
+volume:
+- count: 131511
+ metric: characters
+- count: 151
+ metric: files
+- count: 4376
+ metric: lines
+- count: 150
+ metric: pages
+- count: 375
+ metric: regions