'Settings', 'file path' => drupal_get_path('module', 'system'), 'weight' => -10, 'type' => MENU_DEFAULT_LOCAL_TASK, ); $items['admin/settings/file-system/transliteration'] = array( 'title' => 'Transliteration', 'description' => 'Convert existing file names to US-ASCII.', 'page callback' => 'drupal_get_form', 'page arguments' => array('transliteration_retroactive'), 'access arguments' => array('administer site configuration'), 'file' => 'transliteration.admin.inc', 'weight' => 10, 'type' => MENU_LOCAL_TASK, ); return $items; } /** * Implements hook_form_FORM_ID_alter(). * * Add transliteration settings to the file system configuration form. */ function transliteration_form_system_file_system_settings_alter(&$form, &$form_state) { $form['transliteration'] = array( '#type' => 'item', '#title' => t('Transliteration'), '#value' => '', ); $form['transliteration']['transliteration_file_uploads'] = array( '#type' => 'checkbox', '#title' => t('Transliterate file names during upload.'), '#description' => t('Enable to convert file names to US-ASCII character set for cross-platform compatibility.'), '#default_value' => variable_get('transliteration_file_uploads', TRUE), ); $form['transliteration']['transliteration_file_lowercase'] = array( '#type' => 'checkbox', '#title' => t('Lowercase transliterated file names.'), '#default_value' => variable_get('transliteration_file_lowercase', TRUE), '#description' => t('This is a recommended setting to prevent issues with case-insensitive file systems. It has no effect if transliteration has been disabled.'), ); $form['buttons']['#weight'] = 1; } /** * Transliterate and sanitize a file name. * * The resulting file name has white space replaced with underscores, consists * of only US-ASCII characters, and is converted to lowercase (if configured). * * @param $filename * A file name. * @param $source_langcode * Optional ISO 639 language code that denotes the language of the input and * is used to apply language-specific variations. If the source language is * not known at the time of transliteration, it is recommended to set this * argument to the site default language to produce consistent results. * Otherwise the current display language will be used. * @return * Sanitized file name. * * @see language_default() */ function transliteration_clean_filename($filename, $source_langcode = NULL) { $filename = transliteration_get($filename, '', $source_langcode); // Replace whitespace. $filename = str_replace(' ', '_', $filename); // Remove remaining unsafe characters. $filename = preg_replace('![^0-9A-Za-z_.-]!', '', $filename); // Force lowercase to prevent issues on case-insensitive file systems. if (variable_get('transliteration_file_lowercase', TRUE)) { $filename = strtolower($filename); } return $filename; } /** * Transliterate text. * * Takes an input string in any language and character set, and tries to * represent it in US-ASCII characters by conveying, in Roman letters, the * pronunciation expressed by the text in some other writing system. * * @param $text * UTF-8 encoded text input. * @param $unknown * Replacement string for characters that do not have a suitable ASCII * equivalent. * @param $source_langcode * Optional ISO 639 language code that denotes the language of the input and * is used to apply language-specific variations. If the source language is * not known at the time of transliteration, it is recommended to set this * argument to the site default language to produce consistent results. * Otherwise the current display language will be used. * @return * Transliterated text. * * @see language_default() */ function transliteration_get($text, $unknown = '?', $source_langcode = NULL) { static $loaded = FALSE; if (!$loaded) { module_load_include('inc', 'transliteration'); $loaded = TRUE; } return transliteration_process($text, $unknown, $source_langcode); } /** * Implementation of hook_init(). * * Sanitize file names during upload. */ function transliteration_init() { if (!empty($_FILES['files']) && variable_get('transliteration_file_uploads', TRUE)) { // Figure out language, which is available in $_POST['language'] for node // forms. $langcode = NULL; if (!empty($_POST['language'])) { $languages = language_list(); if (isset($languages[$_POST['language']])) { $langcode = $_POST['language']; } } foreach ($_FILES['files']['name'] as $field => $filename) { // Keep a copy of the unaltered file name. $_FILES['files']['orig_name'][$field] = $filename; $_FILES['files']['name'][$field] = transliteration_clean_filename($filename, $langcode); } } }