summaryrefslogtreecommitdiff
path: root/sources
diff options
context:
space:
mode:
author: Jochen Topf <jochen@topf.org> 2015-03-23 17:48:55 +0100
committer: Jochen Topf <jochen@topf.org> 2015-04-28 21:55:12 +0200
commit: c8a334b10512a708d19ed5fd42aa60424290a371 (patch)
tree: beabdda90200e1d6629285def16674b4c5553b90 /sources
parent: de091284afa48851da7de95f544e75d6800d4e8a (diff)
download: taginfo-c8a334b10512a708d19ed5fd42aa60424290a371.tar
taginfo-c8a334b10512a708d19ed5fd42aa60424290a371.tar.gz
Some experimental code to find Unicode properties in keys.
OSM allows nearly all Unicode characters in keys and values. This is some experimental code to find keys that contain unusual characters. Currently this is not run or used in the normal setup, but I thought I'd throw it out there in case somebody wants to play with it. I am not sure yet myself where this is going.
Diffstat (limited to 'sources')
-rw-r--r-- sources/db/pre.sql 13
-rwxr-xr-x sources/db/update.sh 3
2 files changed, 16 insertions, 0 deletions
diff --git a/sources/db/pre.sql b/sources/db/pre.sql
index 9faf613..165dd38 100644
--- a/sources/db/pre.sql
+++ b/sources/db/pre.sql
@@ -139,3 +139,16 @@ CREATE TABLE prevalent_roles (
fraction REAL
);
+DROP TABLE IF EXISTS key_characters;
+
+CREATE TABLE key_characters (
+ key TEXT,
+ num INTEGER,
+ utf8 TEXT,
+ codepoint TEXT,
+ block INTEGER,
+ category TEXT,
+ direction INTEGER,
+ name TEXT
+);
+
diff --git a/sources/db/update.sh b/sources/db/update.sh
index faa5cde..add5a29 100755
--- a/sources/db/update.sh
+++ b/sources/db/update.sh
@@ -76,6 +76,9 @@ sqlite3 $DATABASE <post_similar_keys.sql
echo "`$DATECMD` Running update_characters... "
./update_characters.rb $DIR
+#echo "`$DATECMD` Running taginfo_unicode... "
+#./taginfo_unicode $DATABASE
+
echo "`$DATECMD` Running post_grades.sql... "
sqlite3 $DATABASE <post_grades.sql