Character encoding detection library for Python using ICU and libmagic. Inspired by Charlock Holmes.
- icu
- file(libmagic)
emerge -av dev-libs/icu
emerge -av sys-apps/file
apt-get install libicu-dev
apt-get install libmagic-dev
brew install icu4c
brew install libmagic
export ICUI18N="/usr/local/Cellar/icu4c/xx" # Replace "xx" with your installed icu4c version
export MAGIC="/usr/local/Cellar/libmagic/xx" # Replace "xx" with your installed libmagic version
python setup.py build
python setup.py install
from charlockholmes import detect
file = open('test.txt')
content = file.read()
print(detect(content))
- 0.0.3
- Add support for Python 3.x
Modified BSD License