wikimedia/mediawiki-core

View on GitHub
includes/language/converters/ShiConverter.php

Summary

Maintainability
C
1 day
Test Coverage
<?php
/**
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
 * http://www.gnu.org/copyleft/gpl.html
 *
 * @file
 */

/**
 * Shilha specific code.
 *
 * Conversion script between Latin and Tifinagh for Tachelhit.
 * - Tifinagh -> lowercase Latin
 * - lowercase/uppercase Latin -> Tifinagh
 *
 *
 * Based on:
 *   - https://en.wikipedia.org/wiki/Shilha_language
 *   - LanguageSr.php
 *
 * @ingroup Languages
 */
class ShiConverter extends LanguageConverterSpecific {
    /**
     * The Tifinagh alphabet sequence is based on
     * "Dictionnaire Général de la Langue Amazighe Informatisé"
     * by IRCAM (https://tal.ircam.ma/dglai/lexieam.php, DGLAi),
     * with the labio-velarization mark in the end
     */
    private const TO_LATIN = [
        'ⴰ' => 'a',
        'ⴱ' => 'b',
        'ⴳ' => 'g',
        'ⴷ' => 'd',
        'ⴹ' => 'ḍ',
        'ⴻ' => 'e',
        'ⴼ' => 'f',
        'ⴽ' => 'k',
        'ⵀ' => 'h',
        'ⵃ' => 'ḥ',
        'ⵄ' => 'ɛ',
        'ⵅ' => 'x',
        'ⵇ' => 'q',
        'ⵉ' => 'i',
        'ⵊ' => 'j',
        'ⵍ' => 'l',
        'ⵎ' => 'm',
        'ⵏ' => 'n',
        'ⵓ' => 'u',
        'ⵔ' => 'r',
        'ⵕ' => 'ṛ',
        'ⵖ' => 'ɣ',
        'ⵙ' => 's',
        'ⵚ' => 'ṣ',
        'ⵛ' => 'c',
        'ⵜ' => 't',
        'ⵟ' => 'ṭ',
        'ⵡ' => 'w',
        'ⵢ' => 'y',
        'ⵣ' => 'z',
        'ⵥ' => 'ẓ',
        'ⵯ' => 'ʷ',
    ];

    /** The sequence is based on DGLAi, with the non-standard letters in the end */
    private const UPPER_TO_LOWER_CASE_LATIN = [
        'A' => 'a',
        'B' => 'b',
        'G' => 'g',
        'D' => 'd',
        'Ḍ' => 'ḍ',
        'E' => 'e',
        'F' => 'f',
        'K' => 'k',
        'H' => 'h',
        'Ḥ' => 'ḥ',
        'Ɛ' => 'ɛ',
        'X' => 'x',
        'Q' => 'q',
        'I' => 'i',
        'J' => 'j',
        'L' => 'l',
        'M' => 'm',
        'N' => 'n',
        'U' => 'u',
        'R' => 'r',
        'Ṛ' => 'ṛ',
        'Ɣ' => 'ɣ',
        'S' => 's',
        'Ṣ' => 'ṣ',
        'C' => 'c',
        'T' => 't',
        'Ṭ' => 'ṭ',
        'W' => 'w',
        'Y' => 'y',
        'Z' => 'z',
        'Ẓ' => 'ẓ',
        'O' => 'o',
        'P' => 'p',
        'V' => 'v',
    ];

    /**
     * The sequence is based on DGLAi, with the labio-velarization mark and
     * the non-standard letters in the end
     */
    private const TO_TIFINAGH = [
        'a' => 'ⴰ',
        'b' => 'ⴱ',
        'g' => 'ⴳ',
        'd' => 'ⴷ',
        'ḍ' => 'ⴹ',
        'e' => 'ⴻ',
        'f' => 'ⴼ',
        'k' => 'ⴽ',
        'h' => 'ⵀ',
        'ḥ' => 'ⵃ',
        'ɛ' => 'ⵄ',
        'x' => 'ⵅ',
        'q' => 'ⵇ',
        'i' => 'ⵉ',
        'j' => 'ⵊ',
        'l' => 'ⵍ',
        'm' => 'ⵎ',
        'n' => 'ⵏ',
        'u' => 'ⵓ',
        'r' => 'ⵔ',
        'ṛ' => 'ⵕ',
        'ɣ' => 'ⵖ',
        's' => 'ⵙ',
        'ṣ' => 'ⵚ',
        'c' => 'ⵛ',
        't' => 'ⵜ',
        'ṭ' => 'ⵟ',
        'w' => 'ⵡ',
        'y' => 'ⵢ',
        'z' => 'ⵣ',
        'ẓ' => 'ⵥ',
        'ʷ' => 'ⵯ',
        'o' => 'ⵓ',
        'p' => 'ⴱ',
        'v' => 'ⴼ',
    ];

    public function getMainCode(): string {
        return 'shi';
    }

    public function getLanguageVariants(): array {
        return [ 'shi', 'shi-tfng', 'shi-latn' ];
    }

    public function getVariantsFallbacks(): array {
        return [
            'shi' => [ 'shi-latn', 'shi-tfng' ],
            'shi-tfng' => 'shi',
            'shi-latn' => 'shi',
        ];
    }

    protected function loadDefaultTables(): array {
        return [
            'lowercase' => new ReplacementArray( self::UPPER_TO_LOWER_CASE_LATIN ),
            'shi-tfng' => new ReplacementArray( self::TO_TIFINAGH ),
            'shi-latn' => new ReplacementArray( self::TO_LATIN ),
            'shi' => new ReplacementArray()
        ];
    }

    public function translate( $text, $toVariant ) {
        // If $text is empty or only includes spaces, do nothing
        // Otherwise translate it
        if ( trim( $text ) ) {
            $this->loadTables();
            // For Tifinagh, first translate uppercase to lowercase Latin
            if ( $toVariant == 'shi-tfng' ) {
                $text = $this->mTables['lowercase']->replace( $text );
            }
            $text = $this->mTables[$toVariant]->replace( $text );
        }
        return $text;
    }
}