<?xml version="1.0" encoding="UTF-8"?><?xml-stylesheet type="text/xsl" href="//www.frenchcorpus.com/main-sitemap.xsl"?>
<urlset xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:image="http://www.google.com/schemas/sitemap-image/1.1" xsi:schemaLocation="http://www.sitemaps.org/schemas/sitemap/0.9 http://www.sitemaps.org/schemas/sitemap/0.9/sitemap.xsd http://www.google.com/schemas/sitemap-image/1.1 http://www.google.com/schemas/sitemap-image/1.1/sitemap-image.xsd" xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
	<url>
		<loc>https://www.frenchcorpus.com/building-an-audit-ready-provenance-trail-for-training-datasets/</loc>
		<lastmod>2026-05-13T20:14:40+00:00</lastmod>
	</url>
	<url>
		<loc>https://www.frenchcorpus.com/training-data-size-for-llms-how-many-tokens-do-you-actually-need-in-2026/</loc>
		<lastmod>2026-05-13T20:14:39+00:00</lastmod>
	</url>
	<url>
		<loc>https://www.frenchcorpus.com/eu-ai-act-article-10-what-training-data-documentation-actually-requires/</loc>
		<lastmod>2026-05-13T20:14:39+00:00</lastmod>
	</url>
	<url>
		<loc>https://www.frenchcorpus.com/sft-datasets-format-structure-and-instruction-tuning-best-practices/</loc>
		<lastmod>2026-05-13T20:14:38+00:00</lastmod>
	</url>
	<url>
		<loc>https://www.frenchcorpus.com/choosing-a-dataset-format-parquet-vs-jsonl-vs-arrow-for-ml-pipelines/</loc>
		<lastmod>2026-05-13T20:14:38+00:00</lastmod>
	</url>
	<url>
		<loc>https://www.frenchcorpus.com/how-to-create-a-training-dataset-for-object-detection/</loc>
		<lastmod>2026-05-13T20:14:37+00:00</lastmod>
	</url>
	<url>
		<loc>https://www.frenchcorpus.com/how-to-train-an-llm-on-your-own-data-a-practical-2026-guide/</loc>
		<lastmod>2026-05-13T20:14:37+00:00</lastmod>
	</url>
</urlset>
<!-- XML Sitemap generated by Rank Math SEO Plugin (c) Rank Math - rankmath.com -->