From 13d69ea5301a6da76a798a335b8006d92e6ce0d2 Mon Sep 17 00:00:00 2001 From: Emerson Rocha Date: Wed, 27 Apr 2022 23:52:39 -0300 Subject: [PATCH] 1603_1.py (#29): profile fix empty columns (but not duplicated ix_wikiq yet) refs https://github.com/EticaAI/multilingual-lexicography/issues/29#issuecomment-1111660211 --- officinam/999999999/0/1603_1.py | 5 +++++ officinam/999999999/999999999.lib.sh | 6 ++++-- officinam/999999999/999999_17.sh | 10 ++++++++-- 3 files changed, 17 insertions(+), 4 deletions(-) diff --git a/officinam/999999999/0/1603_1.py b/officinam/999999999/0/1603_1.py index 836e639..116f04b 100755 --- a/officinam/999999999/0/1603_1.py +++ b/officinam/999999999/0/1603_1.py @@ -3706,6 +3706,11 @@ def imprimere(self): else: return [yaml.dump(self.ex_codice(), allow_unicode=True)] + def imprimere_in_csvw(self) -> list: + # https://github.com/w3c/csvw + # https://www.w3.org/TR/tabular-data-primer/ + raise NotImplementedError('TODO') + def imprimere_in_datapackage(self) -> list: """imprimere_in_datapackage diff --git a/officinam/999999999/999999999.lib.sh b/officinam/999999999/999999999.lib.sh index bc15511..b41e98f 100644 --- a/officinam/999999999/999999999.lib.sh +++ b/officinam/999999999/999999999.lib.sh @@ -449,8 +449,8 @@ file_convert_csv_de_downloaded_xlsx() { # type inference. We need better long term solution for this. # sed -i 's/.0,/,/' "$objectivum_archivum_temporarium" - # rm "$objectivum_archivum_temporarium_csv" - # rm "$objectivum_archivum_temporarium" + rm "$objectivum_archivum_temporarium_csv" + rm "$objectivum_archivum_temporarium" file_update_if_necessary csv "$objectivum_archivum_temporarium_csv2" "$objectivum_archivum" } @@ -515,8 +515,10 @@ file_convert_numerordinatio_de_hxltm() { # @TODO: implement NUMERORDINATIO_STATUS_CONCEPTUM_CODICEM_MINIMAM # instead of hardcode 1|2|3|4|5|6|7|8|9 + # hxlcut --exclude="#meta" \ hxlcut --exclude="#meta" \ "$fontem_archivum" | + hxlcut --skip-untagged | hxlselect --query="#item+conceptum+codicem>0" | hxlselect --query='#status+conceptum+codicem~^(1|2|3|4|5|6|7|8|9)$' --reverse | hxladd --before --spec="#item+conceptum+numerordinatio=${_prefix}:{{#item+conceptum+codicem}}" | diff --git a/officinam/999999999/999999_17.sh b/officinam/999999999/999999_17.sh index 9f7b7e6..52adcdb 100755 --- a/officinam/999999999/999999_17.sh +++ b/officinam/999999999/999999_17.sh @@ -71,6 +71,7 @@ file_download_1603_xlsx "1" # actiones_completis_locali "1603_1_2020" # actiones_completis_locali "1603_44_86" # actiones_completis_locali "1603_45_31" +actiones_completis_locali "1603_63_101" # actiones_completis_locali "1603_99_876" # actiones_completis_locali "1603_1_8000" @@ -82,7 +83,12 @@ file_download_1603_xlsx "1" # deploy_0_9_markdown ## Full drill (remote, randon publish few at time) -opus_temporibus_cdn -deploy_0_9_markdown +# opus_temporibus_cdn +# deploy_0_9_markdown # @TODO: maybe check ssdiff (diff spreadsheets) to our uses. + +# https://github.com/frictionlessdata/frictionless-py +# pip3 install frictionless-py +# frictionless validate data/invalid.csv +# frictionless validate 1603/63/101/1603_63_101.no11.tm.hxl.csv