Skip to content
3 changes: 3 additions & 0 deletions SIS/clarin/data/formats/fCSV.xml
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,8 @@
<keyword>tabular format</keyword>
<keyword type="SSO">W3C</keyword>
<extId type="LOC">fdd000323</extId>
<extDoc type="enWiki">Comma-separated_values</extDoc>
<extDoc type="formatWiki">CSV</extDoc>
<info type="description">
<p>"CSV is one of the most popular formats for publishing data on the web. It is concise, easy
to understand by both humans and computers, and aligns nicely to the tabular nature of most
Expand Down Expand Up @@ -38,6 +40,7 @@
<li><a href="https://specs.frictionlessdata.io/csv-dialect/">CSV Dialect</a> -- a set of modelling parameters for describing various dialects of CSV</li>
</ul>
</info>
<relation target="tabularDataSpec" type="isDefinedBy"/>
<mimeType>text/csv</mimeType>
<fileExt>.csv</fileExt>
<formatFamily>Plain.Delimited</formatFamily>
Expand Down
10 changes: 7 additions & 3 deletions SIS/clarin/data/formats/fDICOM.xml
Original file line number Diff line number Diff line change
Expand Up @@ -11,16 +11,20 @@
<!-- this is also video, and can be lossy... messy -->
<extId type="Wikidata">Q28205908</extId>
<extId type="PRONOM">fmt/574</extId>
<extDoc type="enWiki">DICOM</extDoc>
<extDoc type="formatWiki">DICOM</extDoc>
<info type="description">
<p>See <a href="https://en.wikipedia.org/wiki/DICOM">https://en.wikipedia.org/wiki/DICOM</a>.</p>
<p>Please feel welcome to supply the description of this format file via GitHub: either as an
<a href="https://github.com/clarin-eric/standards/issues">issue report</a>, or as a pull
request after forking or browsing the
<a href="https://github.com/clarin-eric/standards/tree/formats/SIS/clarin/data/formats">code under the 'formats' branch</a>.</p>
<!-- Many image compression formats possible, https://en.wikipedia.org/wiki/DICOM -->
<p>DICOM is standardised by both ISO (ISO 12052) and NEMA (the National Electrical Manufacturers
Association). (The link to the related standard currently looks odd, pending work on its proper visualisation.
Feel welcome to join us.)</p>
</info>
<!--<relation target="SpecDICOM" type="isDefinedBy"/>
ISO 12052, also own committe, and the primary standards body seems to be the NEMA: National Electrical Manufacturers Association
<relation target="SpecDICOM" type="isDefinedBy"/>
<!-- ISO 12052, also own committee, and the primary standards body seems to be the NEMA: National Electrical Manufacturers Association
-->
<mimeType>application/dicom</mimeType>
<fileExt recommended="yes">.dcm</fileExt>
Expand Down
1 change: 1 addition & 0 deletions SIS/clarin/data/formats/fODF.xml
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,7 @@
<keyword>umbrella format</keyword>
<keyword type="SSO">OASIS</keyword>
<extId type="LOC">fdd000247</extId>
<extDoc type="enWiki">OpenDocument</extDoc>
<info type="description" umbrella="yes">
<p>"The Open Document Format for Office Applications (ODF), also known as OpenDocument, standardized as ISO 26300, is an open
file format for word processing documents, spreadsheets, presentations and graphics and using ZIP-compressed XML files.
Expand Down
1 change: 1 addition & 0 deletions SIS/clarin/data/formats/fTextPlain.xml
Original file line number Diff line number Diff line change
Expand Up @@ -7,6 +7,7 @@
<keyword>text format</keyword>
<!-- what other keywords should we add here? -->
<extDoc type="enWiki">Plain_text</extDoc>
<extDoc type="formatWiki">Plain_text</extDoc>
<info type="description">
<p>Plain text is a pure sequence of character codes. (...) Plain text represents character
content only, not its appearance. (...) Plain text must contain enough information to permit
Expand Down
30 changes: 17 additions & 13 deletions SIS/clarin/data/recommendations/CLARIN.SI-recommendation.xml
Original file line number Diff line number Diff line change
Expand Up @@ -2,29 +2,29 @@
<?xml-model href="../../schemas/recommendation.xsd" type="application/xml" schematypens="http://purl.oclc.org/dsdl/schematron"?>
<recommendation xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:noNamespaceSchemaLocation="../../schemas/recommendation.xsd">
<header>
<lastUpdateCommitID>d4ad73e931b56f907716917299724fce4466f996</lastUpdateCommitID>
<lastUpdateCommitID>7ba3aad1a1f81b45e0ed3c53191b741701b48a42</lastUpdateCommitID>
<filter>
<centreID>CLARIN.SI</centreID>
</filter>
<respStmt>
<name>Jakob Lenardič</name>
<resp><!--optionally specify the range of responsibility; useful if multiple respStmt are used--></resp>
<link>https://github.com/jakoble</link>
<reviewDate>2025-04-14</reviewDate>
<reviewDate>2026-06-19</reviewDate>
</respStmt>
<centre id="CLARIN.SI" deposition="1">
<centreName>CLARIN.SI Language Technology Centre, Slovenia</centreName>
<registryLink registry="CLARIN" uri="https://centres.clarin.eu/centre/30"/>
<nodeInfo>
<ri status="B-centre">CLARIN</ri>
</nodeInfo>
<centre id="CLARIN.SI" deposition="1">
<centreName>CLARIN.SI Language Technology Centre, Slovenia</centreName>
<registryLink registry="CLARIN" uri="https://centres.clarin.eu/centre/30"/>
<nodeInfo>
<ri status="B-centre">CLARIN</ri>
</nodeInfo>
</centre>
</header>
</header>
<info>
<p>This page lists the file formats which are recommended for depositing in CLARIN.SI.
For additional information, see <a href="https://www.clarin.si/repository/xmlui/page/data">https://www.clarin.si/repository/xmlui/page/data</a>.</p>
<p>For details on the preservation policy of CLARIN.SI,
see <a href="https://www.clarin.si/repository/xmlui/page/about#preservation-policy">https://www.clarin.si/repository/xmlui/page/about#preservation-policy</a>.</p>
<p>This page lists the file formats which are recommended for depositing in CLARIN.SI. For additional information, see
<a href="https://www.clarin.si/repository/xmlui/page/data">https://www.clarin.si/repository/xmlui/page/data</a>.</p>
<p>For details on the preservation policy of CLARIN.SI, see
<a href="https://www.clarin.si/repository/xmlui/page/about#preservation-policy">https://www.clarin.si/repository/xmlui/page/about#preservation-policy</a>.</p>
</info>
<formats>
<format id="fEXB">
Expand Down Expand Up @@ -179,6 +179,10 @@
<domain>Text Annotation</domain>
<level>recommended</level>
</format>
<format id="fePub">
<domain>Textual Source Language Data</domain>
<level>recommended</level>
</format>
<format id="fEAF">
<domain>Textual Source Language Data</domain>
<level>recommended</level>
Expand Down
79 changes: 23 additions & 56 deletions SIS/clarin/data/recommendations/ILC4CLARIN-recommendation.xml
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@
<?xml-model href="../../schemas/recommendation.xsd" type="application/xml" schematypens="http://purl.oclc.org/dsdl/schematron"?>
<recommendation xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:noNamespaceSchemaLocation="../../schemas/recommendation.xsd">
<header>
<lastUpdateCommitID>147cb5ea659a5752efd819898b43da23e00c6a77</lastUpdateCommitID>
<lastUpdateCommitID>88fa1a1f69809fa389ab2c59a19bdf0a5ecc3f25</lastUpdateCommitID>
<filter>
<centreID>ILC4CLARIN</centreID>
</filter>
Expand All @@ -20,81 +20,48 @@
</nodeInfo>
</centre>
</header>
<info><!--use p, ul, ol elements here--></info>
<info><p>These formats were extracted from the uploaded dataset and matched against
the CLARIN Standards recommendations.</p>
<p>This list was submitted by Riccardo Del Gratta in May 2026.</p>
<p>No active curator has yet been appointed for these recommendations.</p></info>
<formats>
<format id="fMOV">
<domain>Audiovisual Source Language Data</domain>
<level>recommended</level>
</format>
<format id="fMPEG1">
<domain>Audiovisual Source Language Data</domain>
<format id="fXML">
<domain>Metadata</domain>
<level>recommended</level>
</format>
<format id="fWAVE">
<domain>Audiovisual Source Language Data</domain>
<format id="fTXT">
<domain>Textual Source Language Data</domain>
<level>recommended</level>
</format>
<format id="fHTML">
<domain>Documentation</domain>
<format id="fCSV">
<domain>Text Annotation</domain>
<level>recommended</level>
</format>
<format id="fLaTeX">
<format id="fRTF">
<domain>Documentation</domain>
<level>recommended</level>
<level>acceptable</level>
</format>
<format id="fPDF">
<domain>Documentation</domain>
<level>acceptable</level>
</format>
<format id="fTeX">
<domain>Documentation</domain>
<level>recommended</level>
</format>
<format id="fXML">
<domain>Documentation</domain>
<level>recommended</level>
</format>
<format id="fGIF">
<domain>Image Source Language Data</domain>
<level>recommended</level>
</format>
<format id="fJPEG">
<domain>Image Source Language Data</domain>
<level>recommended</level>
</format>
<format id="fTIFF">
<domain>Image Source Language Data</domain>
<level>recommended</level>
</format>
<format id="fRDFXML">
<domain>Text Annotation</domain>
<level>recommended</level>
</format>
<format id="fXML">
<domain>Text Annotation</domain>
<level>recommended</level>
</format>
<format id="fODT">
<domain>Textual Source Language Data</domain>
<level>recommended</level>
</format>
<format id="fPDF">
<format id="fDOCX">
<domain>Textual Source Language Data</domain>
<level>acceptable</level>
</format>
<format id="fTextPlain">
<domain>Textual Source Language Data</domain>
<level>recommended</level>
<format id="fXLSX">
<domain>Metadata</domain>
<level>acceptable</level>
</format>
<format id="fCSS">
<domain>Tool Support</domain>
<level>recommended</level>
<format id="fPPTX">
<domain>Documentation</domain>
<level>acceptable</level>
</format>
<format id="fGZIP">
<format id="fZIP">
<domain>Packaging</domain>
<level>recommended</level>
<level>acceptable</level>
</format>
<format id="fZIP">
<format id="fGZIP">
<domain>Packaging</domain>
<level>recommended</level>
</format>
Expand Down
35 changes: 25 additions & 10 deletions SIS/clarin/data/recommendations/INT-recommendation.xml
Original file line number Diff line number Diff line change
Expand Up @@ -2,15 +2,15 @@
<recommendation xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
xsi:noNamespaceSchemaLocation="../../schemas/recommendation.xsd">
<header>
<lastUpdateCommitID>0378aa7b9c8cd3f73e822dccf09dccf0b3a3ff01</lastUpdateCommitID>
<lastUpdateCommitID>7b0200bfcbc0b0dda978e5eab59859cd913b7658</lastUpdateCommitID>
<filter>
<centreID>INT</centreID>
</filter>
<respStmt>
<name>Griet Depoorter</name>
<resp/>
<link>mailto:griet.depoorter@ivdnt.org</link>
<reviewDate>2025-04-15</reviewDate>
<reviewDate>2026-05-26</reviewDate>
</respStmt>
<centre id="INT" deposition="1">
<centreName>Instituut voor de Nederlandse Taal (Dutch Language Institute) </centreName>
Expand All @@ -35,14 +35,14 @@
href="https://portal.clarin.ivdnt.org/information-about-deposition.html">here </a>
</p>
</info>
<formats>
<formats>
<format id="fDOCX">
<domain>Textual Source Language Data</domain>
<level>acceptable</level>
<level>discouraged</level>
</format>
<format id="fDOCX">
<domain>Documentation</domain>
<level>recommended</level>
<level>acceptable</level>
</format>
<format id="fXLSX">
<domain>Lexical Resource</domain>
Expand Down Expand Up @@ -301,17 +301,32 @@
<level>recommended</level>
</format>
<format id="fXHTML">
<domain>Contextual Data</domain>
<level>recommended</level>
</format>
<format id="fNIF">
<domain>Text Annotation</domain>
<level>acceptable</level>
</format>
<format id="fCoNLL-U">
<domain>Text Annotation</domain>
<level>recommended</level>
</format>
<format id="fCoNLL-U">
<domain>Textual Source Language Data</domain>
<level>recommended</level>
</format>
<format id="fXHTML">
<domain>Documentation</domain>
<format id="fFoLiA">
<domain>Textual Source Language Data</domain>
<level>recommended</level>
</format>
<format id="fNIF">
<domain>Text Annotation</domain>
<format id="fTeX">
<domain>Textual Source Language Data</domain>
<level>acceptable</level>
</format>

<format id="fTEISpoken">
<domain>Audiovisual Annotation</domain>
<level>recommended</level>
</format>
</formats>
</recommendation>