Rev 230 | Go to most recent revision | Details | Compare with Previous | Last modification | View Log | RSS feed
| Rev | Author | Line No. | Line | 
|---|---|---|---|
| 223 | PointedEar | 1 | <!DOCTYPE html> | 
| 2 | <html lang="en""> | ||
| 3 | <head> | ||
| 4 | <meta charset="UTF-8"> | ||
| 232 | PointedEar | 5 | <title>Golic Vulcan – Federation Standard English Dictionary</title> | 
| 223 | PointedEar | 6 | <style type="text/css"> | 
| 230 | PointedEar | 7 |       body { | 
| 8 | font-family: serif; | ||
| 9 | } | ||
| 10 | |||
| 11 | ol | ||
| 12 |       { | ||
| 223 | PointedEar | 13 | padding-left: 0; | 
| 14 | list-style-type: none; | ||
| 15 | } | ||
| 16 | |||
| 230 | PointedEar | 17 | ol li | 
| 18 |       { | ||
| 223 | PointedEar | 19 | margin-left: 0; | 
| 20 | } | ||
| 21 | |||
| 230 | PointedEar | 22 | ol ol | 
| 23 |       { | ||
| 223 | PointedEar | 24 | padding-left: 1em; | 
| 25 | } | ||
| 230 | PointedEar | 26 | |
| 27 |       .type-or-context { | ||
| 28 | font-family: sans-serif; | ||
| 29 | font-size: small; | ||
| 30 | font-weight: bold; | ||
| 31 | } | ||
| 32 | |||
| 33 |       i em { | ||
| 34 | font-weight: bold; | ||
| 35 | } | ||
| 223 | PointedEar | 36 | </style> | 
| 37 | </head> | ||
| 38 | |||
| 39 | <body> | ||
| 230 | PointedEar | 40 | <?php | 
| 232 | PointedEar | 41 | $source_lang = 'vuh-Latn-Gol'; | 
| 223 | PointedEar | 42 | $target_lang = 'en-Latn-Federation'; | 
| 232 | PointedEar | 43 | $lines = file('vuh-gol-en.dict'); | 
| 230 | PointedEar | 44 | ?> | 
| 232 | PointedEar | 45 | <h1>Golic Vulcan – Federation Standard English Dictionary</h1> | 
| 230 | PointedEar | 46 |       <?php | 
| 47 | define('REGEXP_PREFIX_EXAMPLE', '/^ex\s*=\s*/'); | ||
| 223 | PointedEar | 48 | |
| 49 | if ($lines) | ||
| 50 |         { | ||
| 51 | $last_indent = -1; | ||
| 52 | $last_phrases = array(); | ||
| 53 | |||
| 54 | foreach ($lines as $line) | ||
| 55 |           { | ||
| 56 | preg_match('/^(?<lws>\s*)(?<phrase>[^:]+)\s*:\s*(?<transl>.+)/u', $line, $matches); | ||
| 57 | // var_dump($matches); | ||
| 58 | if ($matches) | ||
| 59 |             { | ||
| 60 | $phrase = $matches['phrase']; | ||
| 61 | |||
| 62 | if (mb_strpos($phrase, '#') === false) | ||
| 63 |               { | ||
| 64 | $indent = mb_strlen($matches['lws']) / 2; | ||
| 65 | |||
| 66 | if ($indent > $last_indent) | ||
| 67 |                 { | ||
| 68 | echo '<ol>'; | ||
| 69 |                 } | ||
| 70 |                 else | ||
| 71 |                 { | ||
| 72 | echo str_repeat('</ol>', $last_indent - $indent); | ||
| 73 |                 } | ||
| 74 | |||
| 75 | echo '<li>'; | ||
| 76 | |||
| 77 | $is_example = preg_match(REGEXP_PREFIX_EXAMPLE, $phrase); | ||
| 78 | if ($is_example) | ||
| 79 |                 { | ||
| 80 | $phrase = preg_replace(REGEXP_PREFIX_EXAMPLE, '', $phrase); | ||
| 81 |                 } | ||
| 82 | |||
| 83 | if ($indent > $last_indent) | ||
| 84 |                 { | ||
| 85 | $last_phrases[] = $phrase; | ||
| 86 |                 } | ||
| 87 | else if ($indent < $last_indent) | ||
| 88 |                 { | ||
| 89 | $last_phrases = array_slice($last_phrases, 0, $indent + 1); | ||
| 90 |                 } | ||
| 91 | |||
| 92 | if ($indent <= $last_indent) | ||
| 93 |                 { | ||
| 94 | $last_phrases[count($last_phrases) - 1] = $phrase; | ||
| 95 |                 } | ||
| 96 | |||
| 97 | $phrase = preg_replace( | ||
| 98 | array( | ||
| 99 | '/~/', | ||
| 100 | '/[()]/', | ||
| 101 | ), | ||
| 102 | array( | ||
| 103 | '=', | ||
| 104 | '|', | ||
| 105 | ), | ||
| 106 | $phrase); | ||
| 107 | |||
| 108 | if ($last_phrases) | ||
| 109 |                 { | ||
| 110 | end($last_phrases); | ||
| 111 | |||
| 112 | while (($last_phrase = prev($last_phrases)) !== false) | ||
| 113 |                   { | ||
| 114 | while (mb_strlen($last_phrase) > 1) | ||
| 115 |                     { | ||
| 116 | if (preg_match('/' . preg_quote($last_phrase) . '/i', | ||
| 117 | $phrase, $last_sub_matches)) | ||
| 118 |                       { | ||
| 119 | $phrase = preg_replace('/' . $last_sub_matches[0] . '/i', | ||
| 120 | '<u>\\0</u>', $phrase); | ||
| 121 | break 2; | ||
| 122 |                       } | ||
| 123 | |||
| 124 | $last_phrase = mb_strcut($last_phrase, 0, mb_strlen($last_phrase) - 1); | ||
| 125 |                     } | ||
| 126 |                   } | ||
| 127 |                 } | ||
| 128 | |||
| 129 | $transl = preg_replace( | ||
| 130 | array( | ||
| 131 | '/"([^"]+)"/', | ||
| 230 | PointedEar | 132 | '/\{([^\}]+)\}/', | 
| 133 | '/(^|[\\s+\\[])\\/([\\s\\w\'()-]+)\\/(?=[,.;:\\s+\\]]|$)/u', | ||
| 223 | PointedEar | 134 | '/\|(.*)(?<!\|)/', | 
| 230 | PointedEar | 135 | '/\*(.+?)\*/', | 
| 223 | PointedEar | 136 | '/\\s+~/', | 
| 137 | ), | ||
| 138 | array( | ||
| 139 | '“\\1”', | ||
| 230 | PointedEar | 140 | '<abbr class="type-or-context" lang="' . $target_lang . '">\\1</abbr>', | 
| 141 | '\\1<i lang="' . $source_lang . '">\\2</i>', | ||
| 223 | PointedEar | 142 | '/\\1', | 
| 230 | PointedEar | 143 | '<em>\\1</em>', | 
| 223 | PointedEar | 144 | ' ~', | 
| 145 | ), | ||
| 224 | PointedEar | 146 | $matches['transl']); | 
| 223 | PointedEar | 147 | |
| 148 | echo ($is_example ? "<i lang='$source_lang'>" : "<b lang='$source_lang'>") | ||
| 149 | . $phrase | ||
| 150 | . ($is_example ? '</i>' : '</b>') | ||
| 151 | . " <span lang='$target_lang'>" . $transl . '</span>'; | ||
| 152 | |||
| 153 | $last_indent = $indent; | ||
| 154 |               } | ||
| 155 |             } | ||
| 156 |           } | ||
| 230 | PointedEar | 157 | echo '</ol>'; | 
| 158 | |||
| 159 | //           $phrases = array(); | ||
| 160 | |||
| 161 | //           foreach ($lines as $line) | ||
| 162 | //           { | ||
| 163 | //             preg_match('/^(?<lws>\s*)(?<phrase>[^:]+)\s*:\s*(?<transl>.+)/u', $line, $matches); | ||
| 164 | //             if ($matches) | ||
| 165 | //             { | ||
| 166 | //               $phrase = $matches['phrase']; | ||
| 167 | |||
| 168 | //               /* if not a comment */ | ||
| 169 | //               if (mb_strpos($phrase, '#') === false) | ||
| 170 | //               { | ||
| 171 | //                 $transl = $matches['transl']; | ||
| 172 | |||
| 173 | //                 $is_example = preg_match(REGEXP_PREFIX_EXAMPLE, $phrase); | ||
| 174 | //                 if ($is_example) | ||
| 175 | //                 { | ||
| 176 | //                   /* assign example to previous phrase; indentation irrelevant */ | ||
| 177 | //                   $phrase = preg_replace(REGEXP_PREFIX_EXAMPLE, '', $phrase); | ||
| 178 | |||
| 179 | //                   $prev_phrase['examples'][$phrase] = $transl; | ||
| 180 | //                 } | ||
| 181 | //                 else | ||
| 182 | //                 { | ||
| 183 | //                   /* create new phrase */ | ||
| 184 | //                   $level = mb_strlen($matches['lws']) / 2; | ||
| 185 | |||
| 186 | //                   $phrases[$phrase] = array( | ||
| 187 | //                     'translation' => $transl, | ||
| 188 | //                     'level' => $level | ||
| 189 | //                   ); | ||
| 190 | //                   $prev_phrase =& $phrases[$phrase]; | ||
| 191 | //                 } | ||
| 192 | //               } | ||
| 193 | //             } | ||
| 194 | //           } | ||
| 195 | |||
| 196 | // //           var_dump($phrases); | ||
| 197 | |||
| 198 | //           if ($phrases) | ||
| 199 | //           { | ||
| 200 | //             $prev_level = -1; | ||
| 201 | |||
| 202 | //             foreach ($phrases as $phrase => $data) | ||
| 203 | //             { | ||
| 204 | //               $level = $data['level']; | ||
| 205 | |||
| 206 | //               if ($level > $prev_level) | ||
| 207 | //               { | ||
| 208 | //                 echo "\n<ol>\n"; | ||
| 209 | //               } | ||
| 210 | //               else if ($level < $prev_level) | ||
| 211 | //               { | ||
| 212 | //                 echo str_repeat("</ol>\n", $prev_level - $level); | ||
| 213 | //               } | ||
| 214 | |||
| 215 | //               $translation = $data['translation']; | ||
| 216 | |||
| 217 | //               echo "\n<li>$prev_level => $level <b lang='$source_lang'>" . htmlspecialchars($phrase) . '</b>' | ||
| 218 | //                 . " <span lang='$target_lang'>" . $translation . '</span>'; | ||
| 219 | |||
| 220 | //               if (isset($data['examples'])) | ||
| 221 | //               { | ||
| 222 | //                 echo '<ul>'; | ||
| 223 | |||
| 224 | //                 foreach ($data['examples'] as $original => $translation) | ||
| 225 | //                 { | ||
| 226 | //                   echo "<li><i lang='$source_lang'>" . htmlspecialchars($original) . '</i>' | ||
| 227 | //                     . " <span lang='$target_lang'>" . $translation . '</span></li>'; | ||
| 228 | //                 } | ||
| 229 | |||
| 230 | //                 echo '</ul>'; | ||
| 231 | //               } | ||
| 232 | |||
| 233 | //               $prev_level = $level; | ||
| 234 | //             } | ||
| 235 | |||
| 236 | //             echo '</ol>'; | ||
| 237 | //           } | ||
| 223 | PointedEar | 238 |         ?> | 
| 230 | PointedEar | 239 | <?php } ?> | 
| 223 | PointedEar | 240 | </body> | 
| 241 | </html> |