# Clean up any previous build artifacts so that only freshly built files
# end up in dist/ (everything in dist/ is uploaded below).
rm -rf build/ dist/ *.egg-info/
# Build the package.
# pip is always invoked as `python -m pip` so that the tooling is installed
# into the same interpreter that runs `python -m build`.
python -m pip install --upgrade pip build
python -m pip install --upgrade setuptools
python -m build
# Publish to PyPI (if needed)
python -m pip install --upgrade twine
python -m twine upload dist/*
# Create a virtual environment in ./venv and activate it in the current shell.
python -m venv venv
. venv/bin/activate
# Clean up the build artifacts and rebuild
# Remove earlier build output, including the egg-info directory under src/.
rm -rf \
  build/ \
  dist/ \
  src/text2doc.egg-info/
# Install the project from the current directory in editable mode, then build it.
python -m pip install --editable .
python -m build
text2doc
text2doc implements a virtual file system in memory. This module provides an interface compatible with
the `os` module and supports operations on files and directories stored in RAM rather than on disk.
# Install text2doc; `python -m pip` targets the interpreter that `python` resolves to.
python -m pip install text2doc
# Example usage: call text2doc on a list of strings with a tokenizer instance.
from text2doc import text2doc

tokenizer = YourTokenizer()  # Replace with your tokenizer instance
texts = [
    "This is a sample text.",
    "Another text to tokenize.",
]
docs = text2doc(texts, tokenizer)
print(docs)
# Remove previous build output (build/, dist/ and any top-level *.egg-info/).
rm -rf build/ dist/ *.egg-info/
# Upgrade pip and the `build` frontend, then build the package.
python -m pip install -U pip build
python -m build
# Upgrade twine and upload everything found in dist/.
python -m pip install -U twine
python -m twine upload dist/*