Documentation updates

gbenson · gbenson · commit e5992190a65b · 2024-05-16T01:03:36.000+01:00
diff --git a/README.md b/README.md
@@ -1,8 +1,25 @@
+<p style="float: right">
+    <a href="https://badge.fury.io/py/dom-tokenizers">
+        <img alt="PyPI version" src="https://badge.fury.io/py/dom-tokenizers.svg">
+    </a>
+    <a href="https://github.com/gbenson/dom-tokenizers/blob/master/LICENSE">
+        <img alt="License" src="https://img.shields.io/github/license/gbenson/dom-tokenizers.svg?color=blue">
+    </a>
+</p>
+
 # DOM tokenizers
 
-HTML DOM-aware tokenizers for Hugging Face language models.
+DOM-aware tokenizers for [🤗 Hugging Face](https://huggingface.co/)
+language models.
+
+## Installation
+
+### With pip
+```sh
+pip install "dom-tokenizers[train]"
+```
 
-## Setup for development
+### From sources
 
 ```sh
 git clone https://github.com/gbenson/dom-tokenizers.git
diff --git a/pyproject.toml b/pyproject.toml
@@ -2,15 +2,21 @@
 name = "dom-tokenizers"
 version = "0.0.1"
 authors = [{ name = "Gary Benson" }]
-description = "HTML DOM-aware tokenizers for Hugging Face language models"
+description = "DOM-aware tokenizers for Hugging Face language models"
 readme = "README.md"
-license = { file = "LICENSE" }
+license = { text = "Apache Software License (Apache-2.0)" }
 requires-python = ">=3.10"  # match..case
 classifiers = [
-    "Programming Language :: Python :: 3",
+    "Development Status :: 4 - Beta",
+    "Intended Audience :: Developers",
+    "Intended Audience :: Education",
+    "Intended Audience :: Science/Research",
     "License :: OSI Approved :: Apache Software License",
     "Operating System :: OS Independent",
-    "Development Status :: 4 - Beta",
+    "Programming Language :: Python :: 3",
+    "Programming Language :: Python :: 3.10",
+    "Programming Language :: Python :: 3.11",
+    "Programming Language :: Python :: 3.12",
     "Topic :: Internet :: WWW/HTTP",
     "Topic :: Software Development :: Libraries",
     "Topic :: Scientific/Engineering :: Artificial Intelligence",
@@ -25,8 +31,7 @@ dependencies = [
 
 [project.urls]
 Homepage = "https://github.com/gbenson/dom-tokenizers"
-Repository = "https://github.com/gbenson/dom-tokenizers"
-"Bug Tracker" = "https://github.com/gbenson/dom-tokenizers/issues"
+#Source = "https://github.com/gbenson/dom-tokenizers"
 
 [project.optional-dependencies]
 dev = [