diff options
author | Danjela Lura <danielaluraa@gmail.com> | 2020-06-11 19:04:01 +0200 |
---|---|---|
committer | Christopher Baines <mail@cbaines.net> | 2020-06-19 16:03:32 +0100 |
commit | 8d9a4d105c6bda93e75609ac09102a6953c28c9e (patch) | |
tree | d7fc700f9c48cba3b45fe3cd248652c16a368664 | |
parent | 308e553b11792bc2c06320ac970a06eb2e8a3447 (diff) | |
download | data-service-8d9a4d105c6bda93e75609ac09102a6953c28c9e.tar data-service-8d9a4d105c6bda93e75609ac09102a6953c28c9e.tar.gz |
Get the translated package synopsis and descriptions into the database
Signed-off-by: Christopher Baines <mail@cbaines.net>
6 files changed, 282 insertions, 15 deletions
diff --git a/guix-data-service/jobs/load-new-guix-revision.scm b/guix-data-service/jobs/load-new-guix-revision.scm index 34809b0..9cc4ef4 100644 --- a/guix-data-service/jobs/load-new-guix-revision.scm +++ b/guix-data-service/jobs/load-new-guix-revision.scm @@ -735,7 +735,7 @@ WHERE job_id = $1" (packages-metadata-ids (with-time-logging "fetching inferior package metadata" (inferior-packages->package-metadata-ids - conn packages package-license-set-ids)))) + conn inf packages package-license-set-ids)))) (with-time-logging "getting package-ids" (inferior-packages->package-ids diff --git a/guix-data-service/model/package-metadata.scm b/guix-data-service/model/package-metadata.scm index e2166d5..6180274 100644 --- a/guix-data-service/model/package-metadata.scm +++ b/guix-data-service/model/package-metadata.scm @@ -24,12 +24,32 @@ #:use-module (gcrypt hash) #:use-module (rnrs bytevectors) #:use-module (guix base16) + #:use-module (guix packages) + #:use-module (guix i18n) #:use-module (guix inferior) #:use-module (guix-data-service model location) #:use-module (guix-data-service model utils) #:export (select-package-metadata-by-revision-name-and-version inferior-packages->package-metadata-ids)) +(define locales + '("cs_CZ.utf8" + "da_DK.utf8" + "de_DE.utf8" + "eo_EO.utf8" + "es_ES.utf8" + "fr_FR.utf8" + "hu_HU.utf8" + "pl_PL.utf8" + "pt_BR.utf8" + ;;"sr_SR.utf8" + "sv_SE.utf8" + "vi_VN.utf8" + "zh_CN.utf8")) + +(define inferior-package-id + (@@ (guix inferior) inferior-package-id)) + (define (select-package-metadata package-metadata-values) (define fields '("synopsis" "description" "home_page" "location_id" "license_set_id")) @@ -144,36 +164,199 @@ WHERE packages.id IN ( " RETURNING id" ";")) +(define (inferior-packages->translated-package-descriptions-and-synopsis inferior + inferior-package-id) + + (define (translate inferior-package-id) + `(let* ((package (hashv-ref %package-table ,inferior-package-id)) + (source-locale "en_US.utf8") + (source-synopsis + (begin + (setlocale LC_MESSAGES source-locale) + (P_ (package-synopsis package)))) + (source-description + (begin + (setlocale LC_MESSAGES source-locale) + (P_ (package-description package)))) + (synopsis-by-locale + (filter-map + (lambda (locale) + (catch 'system-error + (lambda () + (setlocale LC_MESSAGES locale)) + (lambda (key . args) + (error + (simple-format + #f + "error changing locale to ~A: ~A ~A" + locale key args)))) + (let ((synopsis + (P_ (package-synopsis package)))) + (setlocale LC_MESSAGES source-locale) + (if (string=? synopsis source-synopsis) + #f + (cons locale synopsis)))) + (list ,@locales))) + (descriptions-by-locale + (filter-map + (lambda (locale) + (catch 'system-error + (lambda () + (setlocale LC_MESSAGES locale)) + (lambda (key . args) + (error + (simple-format + #f + "error changing locale to ~A: ~A ~A" + locale key args)))) + (let ((description + (P_ (package-description package)))) + (setlocale LC_MESSAGES source-locale) + (if (string=? description source-description) + #f + (cons locale description)))) + (list ,@locales)))) + (cons + (cons (cons source-locale source-description) + descriptions-by-locale) + (cons (cons source-locale source-synopsis) + synopsis-by-locale)))) + + (inferior-eval (translate inferior-package-id) inferior)) + +(define (package-synopsis-data->package-synopsis-ids + conn synopsis-by-locale) + (insert-missing-data-and-return-all-ids + conn + "package_synopsis" + '(locale synopsis) + (map (match-lambda + ((locale . synopsis) + (list locale synopsis))) + synopsis-by-locale) + #:delete-duplicates? #t)) + +(define (insert-package-synopsis-set conn package-synopsis-ids) + (let ((query + (string-append + "INSERT INTO package_synopsis_sets (synopsis_ids) VALUES " + (string-append + "('{" + (string-join + (map number->string + (sort package-synopsis-ids <)) + ", ") + "}')") + " RETURNING id"))) + (match (exec-query conn query) + (((id)) id)))) + +(define (package-synopsis-data->package-synopsis-set-id + conn synopsis-by-locale) + (let* ((package-synopsis-ids + (package-synopsis-data->package-synopsis-ids + conn + synopsis-by-locale)) + (package-synopsis-set-id + (exec-query + conn + (string-append + "SELECT id FROM package_synopsis_sets" + " WHERE synopsis_ids = ARRAY[" + (string-join (map number->string + (sort package-synopsis-ids <)) ", ") + "]")))) + (string->number + (match package-synopsis-set-id + (((id)) id) + (() + (insert-package-synopsis-set conn package-synopsis-ids)))))) + +(define (package-description-data->package-description-ids + conn descriptions-by-locale) + (insert-missing-data-and-return-all-ids + conn + "package_descriptions" + '(locale description) + (map (match-lambda + ((locale . description) + (list locale description))) + descriptions-by-locale) + #:delete-duplicates? #t)) + +(define (insert-package-description-set conn package-description-ids) + (let ((query + (string-append + "INSERT INTO package_description_sets (description_ids) VALUES " + (string-append + "('{" + (string-join + (map number->string + (sort package-description-ids <)) + ", ") + "}')") + " RETURNING id"))) + (match (exec-query conn query) + (((id)) id)))) + +(define (package-description-data->package-description-set-id + conn descriptions-by-locale) + (let* ((package-description-ids + (package-description-data->package-description-ids + conn + descriptions-by-locale)) + (package-description-set-id + (exec-query + conn + (string-append + "SELECT id FROM package_description_sets" + " WHERE description_ids = ARRAY[" + (string-join (map number->string + (sort package-description-ids <)) ", ") + "]")))) + (string->number + (match package-description-set-id + (((id)) id) + (() + (insert-package-description-set conn package-description-ids)))))) (define (inferior-packages->package-metadata-ids conn + inferior packages license-set-ids) (define package-metadata (map (lambda (package license-set-id) - (list (inferior-package-synopsis package) - (inferior-package-description package) - (non-empty-string-or-false - (inferior-package-home-page package)) - (location->location-id - conn - (inferior-package-location package)) - license-set-id)) + (let ((translated-package-descriptions-and-synopsis + (inferior-packages->translated-package-descriptions-and-synopsis + inferior (inferior-package-id package)))) + (list (non-empty-string-or-false + (inferior-package-home-page package)) + (location->location-id + conn + (inferior-package-location package)) + license-set-id + (package-description-data->package-description-set-id + conn + (car translated-package-descriptions-and-synopsis)) + (package-synopsis-data->package-synopsis-set-id + conn + (cdr translated-package-descriptions-and-synopsis))))) packages license-set-ids)) (insert-missing-data-and-return-all-ids conn "package_metadata" - '(synopsis description home_page location_id license_set_id) + '(home_page location_id license_set_id package_description_set_id package_synopsis_set_id) (map (match-lambda - ((synopsis description home-page location-id license-set-id) - (list synopsis - description - (if (string? home-page) + ((home-page location-id license-set-id package_description_set_id package_synopsis_set_id) + (list (if (string? home-page) home-page NULL) location-id - license-set-id))) + license-set-id + package_description_set_id + package_synopsis_set_id))) package-metadata) ;; There can be duplicated entires in package-metadata, for example where ;; you have one package definition which interits from another, and just diff --git a/sqitch/deploy/translations_for_package_synopsis_and_descriptions.sql b/sqitch/deploy/translations_for_package_synopsis_and_descriptions.sql new file mode 100644 index 0000000..627ea93 --- /dev/null +++ b/sqitch/deploy/translations_for_package_synopsis_and_descriptions.sql @@ -0,0 +1,69 @@ +-- Deploy guix-data-service:translations_for_package_synopsis_and_descriptions to pg + +BEGIN; + +CREATE TABLE package_descriptions ( + id integer PRIMARY KEY GENERATED ALWAYS AS IDENTITY, + locale varchar NOT NULL, + description varchar NOT NULL, + UNIQUE (locale, description) +); + +CREATE TABLE package_description_sets ( + id integer PRIMARY KEY GENERATED ALWAYS AS IDENTITY, + description_ids integer[] NOT NULL, + UNIQUE (description_ids) +); + +CREATE TABLE package_synopsis ( + id integer PRIMARY KEY GENERATED ALWAYS AS IDENTITY, + locale varchar NOT NULL, + synopsis varchar NOT NULL, + UNIQUE (locale, synopsis) +); + +CREATE TABLE package_synopsis_sets ( + id integer PRIMARY KEY GENERATED ALWAYS AS IDENTITY, + synopsis_ids integer[] NOT NULL, + UNIQUE (synopsis_ids) +); + +ALTER TABLE package_metadata ADD COLUMN package_description_set_id integer REFERENCES package_description_sets (id); + +ALTER TABLE package_metadata ADD COLUMN package_synopsis_set_id integer REFERENCES package_synopsis_sets (id); + +INSERT INTO package_descriptions (locale, description) +SELECT DISTINCT 'en_US.utf8', description + FROM package_metadata; + +INSERT INTO package_description_sets (description_ids) +SELECT ARRAY[id] FROM package_descriptions; + +INSERT INTO package_synopsis (locale, synopsis) +SELECT DISTINCT 'en_US.utf8', synopsis + FROM package_metadata; + +INSERT INTO package_synopsis_sets (synopsis_ids) +SELECT ARRAY[id] FROM package_synopsis; + +UPDATE package_metadata + SET package_description_set_id = + package_description_sets.id + FROM package_description_sets + INNER JOIN package_descriptions + ON package_description_sets.description_ids[1] = package_descriptions.id + WHERE package_descriptions.description = package_metadata.description; + +UPDATE package_metadata + SET package_synopsis_set_id = + package_synopsis_sets.id + FROM package_synopsis_sets + INNER JOIN package_synopsis + ON package_synopsis_sets.synopsis_ids[1] = package_synopsis.id + WHERE package_synopsis.synopsis = package_metadata.synopsis; + +ALTER TABLE package_metadata DROP COLUMN description; + +ALTER TABLE package_metadata DROP COLUMN synopsis; + +COMMIT; diff --git a/sqitch/revert/translations_for_package_synopsis_and_descriptions.sql b/sqitch/revert/translations_for_package_synopsis_and_descriptions.sql new file mode 100644 index 0000000..00a6fc3 --- /dev/null +++ b/sqitch/revert/translations_for_package_synopsis_and_descriptions.sql @@ -0,0 +1,7 @@ +-- Revert guix-data-service:translations_for_package_synopsis_and_descriptions from pg + +BEGIN; + +-- XXX Add DDLs here. + +COMMIT; diff --git a/sqitch/sqitch.plan b/sqitch/sqitch.plan index 911c43b..dc0d147 100644 --- a/sqitch/sqitch.plan +++ b/sqitch/sqitch.plan @@ -60,3 +60,4 @@ remove_odd_package_derivations 2020-04-24T20:36:06Z Christopher Baines <mail@cba build_servers_lookup_builds 2020-05-24T15:18:09Z Christopher Baines <mail@cbaines.net> # Add build_servers.lookup_builds make_nar_urls_file_size_optional 2020-06-03T05:27:29Z Christopher Baines <mail@cbaines.net> # Make the nar_urls.file_size optional translations_for_lint_checker_descriptions 2020-05-22T19:49:37Z daniela <daniela@linux-ijv5> # Support translations for lint checker descriptions +translations_for_package_synopsis_and_descriptions 2020-06-09T12:42:54Z daniela <daniela@linux-ijv5> # Support translations for package synopsis and descriptions diff --git a/sqitch/verify/translations_for_package_synopsis_and_descriptions.sql b/sqitch/verify/translations_for_package_synopsis_and_descriptions.sql new file mode 100644 index 0000000..a93c379 --- /dev/null +++ b/sqitch/verify/translations_for_package_synopsis_and_descriptions.sql @@ -0,0 +1,7 @@ +-- Verify guix-data-service:translations_for_package_synopsis_and_descriptions on pg + +BEGIN; + +-- XXX Add verifications here. + +ROLLBACK; |