diff options
author | Jochen Topf <jochen@topf.org> | 2015-03-23 17:48:55 +0100 |
---|---|---|
committer | Jochen Topf <jochen@topf.org> | 2015-04-28 21:55:12 +0200 |
commit | c8a334b10512a708d19ed5fd42aa60424290a371 (patch) | |
tree | beabdda90200e1d6629285def16674b4c5553b90 /sources | |
parent | de091284afa48851da7de95f544e75d6800d4e8a (diff) | |
download | taginfo-c8a334b10512a708d19ed5fd42aa60424290a371.tar taginfo-c8a334b10512a708d19ed5fd42aa60424290a371.tar.gz |
Some experimental code to find Unicode properties in keys.
OSM allows nearly all Unicode characters in keys and values. This is some
experimental code to find keys that contain unusual characters. Currently
it is not run or used in the normal setup, but I thought I'd throw it
out there in case somebody wants to play with it. I am not yet sure myself
where this is going.
Diffstat (limited to 'sources')
-rw-r--r-- | sources/db/pre.sql | 13 | ||||
-rwxr-xr-x | sources/db/update.sh | 3 |
2 files changed, 16 insertions, 0 deletions
```diff
diff --git a/sources/db/pre.sql b/sources/db/pre.sql
index 9faf613..165dd38 100644
--- a/sources/db/pre.sql
+++ b/sources/db/pre.sql
@@ -139,3 +139,16 @@ CREATE TABLE prevalent_roles (
     fraction REAL
 );
 
+DROP TABLE IF EXISTS key_characters;
+
+CREATE TABLE key_characters (
+    key TEXT,
+    num INTEGER,
+    utf8 TEXT,
+    codepoint TEXT,
+    block INTEGER,
+    category TEXT,
+    direction INTEGER,
+    name TEXT
+);
+
diff --git a/sources/db/update.sh b/sources/db/update.sh
index faa5cde..add5a29 100755
--- a/sources/db/update.sh
+++ b/sources/db/update.sh
@@ -76,6 +76,9 @@ sqlite3 $DATABASE <post_similar_keys.sql
 echo "`$DATECMD` Running update_characters... "
 ./update_characters.rb $DIR
 
+#echo "`$DATECMD` Running taginfo_unicode... "
+#./taginfo_unicode $DATABASE
+
 echo "`$DATECMD` Running post_grades.sql... "
 sqlite3 $DATABASE <post_grades.sql
 
```