<?php
/* -*- tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
/*
# ***** BEGIN LICENSE BLOCK *****
# This file is part of Plume Framework, a simple PHP Application Framework.
# Copyright (C) 2001-2007 Loic d'Anterroches and contributors.
#
# Plume Framework is free software; you can redistribute it and/or modify
# it under the terms of the GNU Lesser General Public License as published by
# the Free Software Foundation; either version 2.1 of the License, or
# (at your option) any later version.
#
# Plume Framework is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU Lesser General Public License for more details.
#
# You should have received a copy of the GNU Lesser General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
#
# ***** END LICENSE BLOCK ***** */
/**
 * Unit tests for the n-gram helpers exposed by Pluf_Text_Lang.
 *
 * Exercises Pluf_Text_Lang::docNgrams() and
 * Pluf_Text_Lang::ngramDistance() on short English and French samples.
 */
class Pluf_Tests_Text_Lang extends UnitTestCase
{
    /**
     * Register the test case under its human readable label.
     */
    public function __construct()
    {
        parent::__construct('Test the language detection.');
    }

    /**
     * The n-gram set built from the English sample must hold 128 entries.
     */
    public function testNGrams()
    {
        $sample = 'test the language detection with a simple string this file is part of plume framework a simple php application framework';
        $ngrams = Pluf_Text_Lang::docNgrams($sample);
        $total = count($ngrams);
        $this->assertEqual($total, 128);
    }

    /**
     * Check the distance between n-gram sets.
     *
     * The reordered English sample contains the same words as the
     * original English sample, only with the phrases moved around.
     * The test expects a distance of zero between the two, and expects
     * both to be at the same distance from the French sample.
     */
    public function testNGramsDist()
    {
        $english = 'test the language detection with a simple string this file is part of plume framework a simple php application framework';
        $french = 'teste la detection de la langue avec une simple chaine ce fichier fait partie de plume framework un framework simple de developpement d applications en php';
        $reordered = 'test the this file is part of plume framework a simple php application framework language detection with a simple string';

        $englishNgrams = Pluf_Text_Lang::docNgrams($english);
        $frenchNgrams = Pluf_Text_Lang::docNgrams($french);
        $reorderedNgrams = Pluf_Text_Lang::docNgrams($reordered);

        // Same words, different order: no distance expected.
        $sameWordsDistance = Pluf_Text_Lang::ngramDistance($englishNgrams, $reorderedNgrams);
        $this->assertEqual(0, $sameWordsDistance);

        // Both English variants must be equally far from the French text.
        $englishToFrench = Pluf_Text_Lang::ngramDistance($englishNgrams, $frenchNgrams);
        $reorderedToFrench = Pluf_Text_Lang::ngramDistance($reorderedNgrams, $frenchNgrams);
        $this->assertEqual($englishToFrench, $reorderedToFrench);
    }
}