(* List of Russian names from mycoweb-stv.ru.

   maintainRussianSvetlova takes no arguments; evaluating the symbol runs the
   whole pipeline:
     1. urlsave[url, file, textcondit] is called before the file is read.
        urlsave and textcondit are defined outside this block; presumably
        urlsave stores the page at url in file -- TODO confirm.
     2. file is imported as text and narrowed twice, first with match0 and
        then with match0a, keeping the first hit each time.
     3. match extracts two-group records, stored swapped as
        {second group, first group}.
     4. The records are passed through updatenames into rusnames5.
        rusnames5a keeps the entries whose second element contains neither
        a "." nor a digit, with that element split at parentheses.

   Results are left in the global symbols rusnames5 and rusnames5a. The
   working symbols url, file, match0, match0a, match, text and data are
   global as well. The definition always evaluates to Null.

   If the file cannot be read or one of the narrowing patterns finds
   nothing, an error is printed and the run stops at that point, leaving
   rusnames5 and rusnames5a untouched. *)
maintainRussianSvetlova := Catch[
  url = "http://mycoweb-stv.ru/spisok_vidov/rus-lat/index.html";
  file = "mushrooms-russian-svetlova.htm";

  (* Everything from the Russian anchor phrase to the end of the text.
     NOTE(review): the empty trailing string here, and the bare newline
     delimiters in match0a and match below, look as if markup was stripped
     from these literals -- confirm against the intended page structure. *)
  match0 =
"\:0430\:0432\:0442\:043e\:0440\:043e\:0432 \:0438 \:043d\:0430\
\:0441\:0442\:043e\:044f\:0449\:0435\:0433\:043e \:0441\:0430\:0439\
\:0442\:0430" ~~ __ ~~ "";

  (* A newline, at least one character, and a newline. *)
  match0a = "
" ~~ __ ~~ "
";

  (* One record: two lazily matched fields of 3..50 characters separated by
     " -" and terminated by a newline. *)
  match = RegularExpression[
"(?i)\\s*(.{3,50}?)\\s* [-]\\s*(.{3,50}?)\\s*
"];

  urlsave[url, file, textcondit];

  text = Import[file, "TEXT"];
  (* Import yields $Failed rather than a string when the file is unreadable. *)
  If[! StringQ[text],
    Print["Error: cannot read file ", file];
    Throw[Null, "maintainRussianSvetlova"]];

  text = StringCases[text, match0];
  (* Stop here: taking Part 1 of an empty list would only cascade errors. *)
  If[text === {},
    Print["Error: no match: ", match0];
    Throw[Null, "maintainRussianSvetlova"]];
  text = text[[1]];

  text = StringCases[text, match0a];
  If[text === {},
    Print["Error: no match: ", match0a];
    Throw[Null, "maintainRussianSvetlova"]];
  text = text[[1]];

  (* Swap the captured groups: second group first, first group second. *)
  data = StringCases[text, match -> {"$2", "$1"}];
  Print["Found ", Length[data], " names in file ", file, " -> rusnames5"];
  printnames[data // TableForm];
  rusnames5 = updatenames[data];

  (* Drop entries whose second element contains a period or a digit. *)
  rusnames5a =
    Select[rusnames5,
      StringFreeQ[#[[2]], {".", RegularExpression["[0-9]"]}] &];

  (* Split the second element at "(" and ")", absorbing adjacent spaces.
     Function scopes its parameter lexically, so no global symbols are
     assigned while iterating. *)
  rusnames5a = Map[
    Function[entry,
      {entry[[1]],
       StringSplit[entry[[2]],
         {" " ... ~~ "(" ~~ " " ..., " " ... ~~ ")" ~~ " " ...}]}],
    rusnames5a];

  Null,
  "maintainRussianSvetlova"];