OSM QA tools:
* fixed parsing of the number of inhabitants when it contains HTML entities
* fixed the Wikipedia name of Grabow
This commit is contained in:
parent
9269781f4e
commit
ead2c41bb3
1 changed file with 3 additions and 1 deletion
|
@ -36,6 +36,7 @@ Dmitz D%C3%B6mitz
|
||||||
Friedland Friedland_(Mecklenburg)
|
Friedland Friedland_(Mecklenburg)
|
||||||
FrstenbergHavel F%C3%BCrstenberg/Havel
|
FrstenbergHavel F%C3%BCrstenberg/Havel
|
||||||
Goldberg Goldberg_(Mecklenburg)
|
Goldberg Goldberg_(Mecklenburg)
|
||||||
|
Grabow Grabow_(Elde)
|
||||||
Malchow Malchow_(Mecklenburg)
|
Malchow Malchow_(Mecklenburg)
|
||||||
OstseebadRerik Rerik
|
OstseebadRerik Rerik
|
||||||
RbelMritz R%C3%B6bel
|
RbelMritz R%C3%B6bel
|
||||||
|
@ -56,11 +57,12 @@ get_place_data() {
|
||||||
|
|
||||||
get_place_size() {
|
get_place_size() {
|
||||||
# call "zcat -f" to uncompress a page if necessary
|
# call "zcat -f" to uncompress a page if necessary
|
||||||
|
# ignore HTML entities like "&#160;" (non-breaking space) within the number
|
||||||
wget --quiet --output-document - "$WIKIPEDIA_URL/$1" \
|
wget --quiet --output-document - "$WIKIPEDIA_URL/$1" \
|
||||||
| zcat -f \
|
| zcat -f \
|
||||||
| grep -A 1 "^<td>Einwohner:</td>$" \
|
| grep -A 1 "^<td>Einwohner:</td>$" \
|
||||||
| tail -1 | cut -d ">" -f 2 | cut -d "<" -f 1 \
|
| tail -1 | cut -d ">" -f 2 | cut -d "<" -f 1 \
|
||||||
| sed s/[^0-9]//g
|
| sed -r 's/&#[0-9]{3};//g' | sed s/[^0-9]//g
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
|
Loading…
Reference in a new issue