Skip to content

Commit 9c14dab

Browse files
[Automatic] Update of the Catalog
1 parent d84d7bf commit 9c14dab

File tree

4 files changed

+588
-109
lines changed

4 files changed

+588
-109
lines changed

catalog.json

+241
Original file line numberDiff line numberDiff line change
@@ -12375,6 +12375,179 @@
1237512375
],
1237612376
"_pid": "1f8e04f53"
1237712377
},
12378+
"b69c3be91": {
12379+
"authors": [
12380+
{
12381+
"name": "Alix",
12382+
"orcid": "0000-0002-0136-4434",
12383+
"roles": [
12384+
"transcriber",
12385+
"project-manager",
12386+
"quality-control",
12387+
"support"
12388+
],
12389+
"surname": "Chagu\u00e9"
12390+
},
12391+
{
12392+
"name": "Julie",
12393+
"roles": [
12394+
"transcriber",
12395+
"quality-control"
12396+
],
12397+
"surname": "Ciss\u00e9"
12398+
},
12399+
{
12400+
"name": "Radia",
12401+
"roles": [
12402+
"transcriber",
12403+
"quality-control"
12404+
],
12405+
"surname": "Kichou"
12406+
}
12407+
],
12408+
"automatically-aligned": false,
12409+
"characters": {
12410+
"members": [
12411+
"e",
12412+
"a",
12413+
"s",
12414+
"r",
12415+
"n",
12416+
"t",
12417+
"i",
12418+
"u",
12419+
"l",
12420+
"o",
12421+
"d",
12422+
"p",
12423+
"c",
12424+
"m",
12425+
"\u0301",
12426+
"-",
12427+
"'",
12428+
"v",
12429+
",",
12430+
"\u0300",
12431+
"f",
12432+
"b",
12433+
"q",
12434+
"g",
12435+
"h",
12436+
".",
12437+
"A",
12438+
"x",
12439+
"j",
12440+
"P",
12441+
"L",
12442+
"1",
12443+
"E",
12444+
"\u0302",
12445+
"M",
12446+
"2",
12447+
"^",
12448+
"y",
12449+
"S",
12450+
"C",
12451+
"D",
12452+
"\u0327",
12453+
"J",
12454+
"T",
12455+
"z",
12456+
"R",
12457+
"I",
12458+
"G",
12459+
"9",
12460+
"F",
12461+
"\"",
12462+
"?",
12463+
";",
12464+
"!",
12465+
"N",
12466+
"4",
12467+
"0",
12468+
"U",
12469+
"5",
12470+
"B",
12471+
"(",
12472+
")",
12473+
"3",
12474+
"8",
12475+
"6",
12476+
"7",
12477+
"[",
12478+
"]",
12479+
"H",
12480+
"Q",
12481+
"k",
12482+
"=",
12483+
":",
12484+
"\u00d7",
12485+
"Y",
12486+
"\u27e6",
12487+
"\u27e7",
12488+
"O"
12489+
],
12490+
"mode": "NFD"
12491+
},
12492+
"citation-file-link": "https://github.com/alix-tz/dataset-celestine-doniau-danest/CITATION.cff",
12493+
"description": "Jeu de v\u00e9rit\u00e9s de terrain pour la transcription automatique produit avec eScriptorium dans le cadre du cours HNU2000 \u00e0 l\u2019Universit\u00e9 de Montr\u00e9al au trimestre d'automne 2024. Le jeu de donn\u00e9es contient des pages tir\u00e9es al\u00e9atoirement des num\u00e9risation du \"Journal de C\u00e9lestine Doniau-Danest sur les d\u00e9buts de la Guerre 1914-1918\" mis en ligne par les Archives d\u00e9partementales de la Somme. \n\n*Ground Truth dataset for automatic text recognition created with eScriptorium during the HNU 2000 course at the Universit\u00e9 de Montr\u00e9al during the Fall 2024 semester. The dataset contains pages taken randomly from the digitization of the \"Journal de C\u00e9lestine Doniau-Danest sur les d\u00e9buts de la Guerre 1914-1918\" (Diary of C\u00e9lestine Doniau-Danest on the beginning of the 1914-1918 war), published by the departmental archives of Somme.*",
12494+
"format": "Alto-XML",
12495+
"hands": {
12496+
"count": "1",
12497+
"precision": "exact"
12498+
},
12499+
"institutions": [],
12500+
"language": [
12501+
"fra"
12502+
],
12503+
"license": {
12504+
"name": "CC-BY 4.0",
12505+
"url": "https://creativecommons.org/licenses/by/4.0/"
12506+
},
12507+
"production-software": "eScriptorium + Kraken",
12508+
"project-name": "HNU2000@UdeM",
12509+
"schema": "https://htr-united.github.io/schema/2023-06-27/schema.json",
12510+
"script": [
12511+
{
12512+
"iso": "Latn"
12513+
}
12514+
],
12515+
"script-type": "only-manuscript",
12516+
"sources": [
12517+
{
12518+
"link": "https://archives.somme.fr/ark:/58483/tjrd8pq42716",
12519+
"reference": ""
12520+
}
12521+
],
12522+
"time": {
12523+
"notAfter": "1915",
12524+
"notBefore": "1914"
12525+
},
12526+
"title": "GT Celestine Doniau-Danest",
12527+
"transcription-guidelines": "De mani\u00e8re g\u00e9n\u00e9rale, les r\u00e8gles de transcription suivies sont immitatives. \n\n- Mots illisibles: durant la phase de transcription, les mots illisibles ont \u00e9t\u00e9 transcrits par \\[???\\]. Ils ont ensuite \u00e9t\u00e9 r\u00e9solus collectivement.\n- D\u00e9coration du texte: les d\u00e9corations comme le soulignage, etc, n'ont pas fait l'objet d'une transcription distincte du reste du texte.\n- Correction et normalisation: les fautes d'orthographes ont \u00e9t\u00e9 reproduites telles que dans la source, les espacements sont en revanche normalis\u00e9s selon l'usage moderne.\n- Ponctuation: \n - pour la transcription des points (.) et des tirets (-), on a respect\u00e9 le trac\u00e9\ndans la source plut\u00f4t que l'usage attendu car le trac\u00e9 de ces deux signes est tr\u00e8s distinct. \n - les signes de ponctuation double (:;?!) ne sont pas pr\u00e9c\u00e9d\u00e9 d'un espace.",
12528+
"url": "https://github.com/alix-tz/dataset-celestine-doniau-danest",
12529+
"volume": [
12530+
{
12531+
"count": 8024,
12532+
"metric": "characters"
12533+
},
12534+
{
12535+
"count": 4,
12536+
"metric": "files"
12537+
},
12538+
{
12539+
"count": 144,
12540+
"metric": "lines"
12541+
},
12542+
{
12543+
"count": 8,
12544+
"metric": "regions"
12545+
}
12546+
],
12547+
"_bibtex": "@misc{YourReferenceHere,\nauthor = {Chagu\u00e9, Alix and Ciss\u00e9, Julie and Kichou, Radia},\ntitle = {GT Celestine Doniau-Danest},\nurl = {https://archives.somme.fr/ark:/58483/tjrd8pq42716}\n}\n",
12548+
"_apa": "Chagu\u00e9 A., Ciss\u00e9 J., Kichou R. GT Celestine Doniau-Danest URL: https://archives.somme.fr/ark:/58483/tjrd8pq42716\n",
12549+
"_pid": "b69c3be91"
12550+
},
1237812551
"d26cd8486": {
1237912552
"schema": "https://htr-united.github.io/schema/2023-06-27/schema.json",
1238012553
"title": "Moonshines",
@@ -14511,6 +14684,74 @@
1451114684
"automatically-aligned": false,
1451214685
"_pid": "98985e96b"
1451314686
},
14687+
"9f3c75a3b": {
14688+
"schema": "https://htr-united.github.io/schema/2023-06-27/schema.json",
14689+
"title": "DISTINGUO : Ground truth for Handwritten Text Recognition (HTR) on Collections of Distinctions (late 13th to late 15th century) ",
14690+
"url": "https://nakala.fr/10.34847/nkl.48ad8b8d",
14691+
"authors": [
14692+
{
14693+
"name": "Svetlana",
14694+
"surname": "Yatsyk",
14695+
"orcid": "0000-0001-5356-7746",
14696+
"roles": [
14697+
"transcriber",
14698+
"aligner"
14699+
]
14700+
}
14701+
],
14702+
"institutions": [],
14703+
"description": "This dataset contains normalized transcriptions of collections of distinctions, specifically \"Summa de abstinentia\" by Nicolas of Biard and \"Dictionarium bovis\" by Thomas of Pavia. They were prepared as part of the DISTINGUO project, dedicated to the study of distinctiones in medieval Latin preaching and led by Marjorie Burghart in 2019-2024.",
14704+
"project-website": "https://distinguo.huma-num.fr/",
14705+
"language": [
14706+
"lat"
14707+
],
14708+
"production-software": "eScriptorium + Kraken",
14709+
"automatically-aligned": false,
14710+
"script": [
14711+
{
14712+
"iso": "Latn"
14713+
}
14714+
],
14715+
"script-type": "only-manuscript",
14716+
"time": {
14717+
"notBefore": "1250",
14718+
"notAfter": "1499"
14719+
},
14720+
"hands": {
14721+
"count": "1-per-folder",
14722+
"precision": "estimated"
14723+
},
14724+
"license": {
14725+
"name": "CC-BY 4.0",
14726+
"url": "https://creativecommons.org/licenses/by/4.0/"
14727+
},
14728+
"format": "Page-XML",
14729+
"sources": [
14730+
{
14731+
"reference": "Yatsyk, S. (2024). DISTINGUO : Ground truth for Handwritten Text Recognition (HTR) on Collections of Distinctions (late 13th to late 15th century) (Version 1) [Data set]. NAKALA - https://nakala.fr (Huma-Num - CNRS).",
14732+
"link": "https://doi.org/10.34847/NKL.48AD8B8D"
14733+
}
14734+
],
14735+
"volume": [
14736+
{
14737+
"metric": "lines",
14738+
"count": 15190
14739+
},
14740+
{
14741+
"metric": "characters",
14742+
"count": 682486
14743+
},
14744+
{
14745+
"metric": "regions",
14746+
"count": 1076
14747+
},
14748+
{
14749+
"metric": "pages",
14750+
"count": 318
14751+
}
14752+
],
14753+
"_pid": "9f3c75a3b"
14754+
},
1451414755
"1dd38d4a3": {
1451514756
"schema": "https://htr-united.github.io/schema/2023-06-27/schema.json",
1451614757
"title": "Ground truth for Neue Z\u00fcrcher Zeitung black letter period",

graph.png

1.17 KB
Loading

0 commit comments

Comments
 (0)