This small extension provides bindings to use the Chromium Compact Language Detector (http://code.google.com/p/chromium-compact-language-detector/) in PHP.
- Check out the Chromium Compact Language Detector with
hg clone https://code.google.com/p/chromium-compact-language-detector
- Run
./build.sh
- Check out this project
- Run
phpize && ./configure --with-libcld-dir=... && make && sudo make install
- Add
extension=cld.so
to your php.ini
<?php
var_export(CLD\detect("Drüben hinterm Dorfe wohnt ein Leiermann. Und mit starren Fingern spielt er was er kann"));
var_export(CLD\detect("日[の]本([の]国", false, true, null, CLD\Language::JAPANESE, CLD\Encoding::JAPANESE_EUC_JP));
<?php
$detector = new CLD\Detector();
var_export($detector->detect('Drüben hinterm Dorfe wohnt ein Leiermann. Und mit starren Fingern spielt er was er kann'));
$detector->setLanguageHint(CLD\Language::JAPANESE);
$detector->setEncodingHint(CLD\Encoding::JAPANESE_EUC_JP);
$detector->detect("日[の]本([の]国", false);
will return
array (
0 =>
array (
'name' => 'GERMAN',
'code' => 'de',
'reliable' => true,
'bytes' => 90,
),
)
array (
0 =>
array (
'name' => 'JAPANESE',
'code' => 'ja',
'reliable' => true,
'bytes' => 22,
),
1 =>
array (
'name' => 'CHINESE',
'code' => 'zh',
'reliable' => true,
'bytes' => 22,
),
)