From: Nathan TeBlunthuis Date: Thu, 29 May 2025 03:54:52 +0000 (-0700) Subject: Merge branch 'parquet_support' of code:mediawiki_dump_tools into parquet_support X-Git-Url: https://code.communitydata.science/mediawiki_dump_tools.git/commitdiff_plain/8c7d46472f53ec4710a579ba4cf542bec1003854?hp=1aea601a3018bbd5c7b4c67da92fdd7a388d8393 Merge branch 'parquet_support' of code:mediawiki_dump_tools into parquet_support --- diff --git a/wikiq b/wikiq index 2cb0c3a..75c1af8 100755 --- a/wikiq +++ b/wikiq @@ -250,13 +250,13 @@ class RevDataBase(): pa.field("revid", pa.int64()), pa.field("date_time", pa.timestamp('ms')), pa.field("articleid",pa.int64()), - pa.field("editorid",pa.int64()), + pa.field("editorid",pa.int64(), nullable=True), pa.field("title",pa.string()), pa.field("namespace",pa.int32()), pa.field("deleted",pa.bool_()), - pa.field("test_chars",pa.int32()), - pa.field("revert",pa.bool_()), - pa.field("reverteds",pa.list_(pa.int64())), + pa.field("text_chars",pa.int32()), + pa.field("revert",pa.bool_(), nullable=True), + pa.field("reverteds",pa.list_(pa.int64()), nullable=True), pa.field("sha1",pa.string()), pa.field("minor",pa.bool_()), pa.field("editor",pa.string()),