def __init__(self, page, namespace_map, collapse_user=False):
self.id = page.id
self.namespace = page.namespace
+ # following mwxml, we assume namespace 0 in cases where
+ # page.namespace is inconsistent with namespace_map
+ if page.namespace not in namespace_map:
+ self.title = page.title
+ page.namespace = 0
if page.namespace != 0:
self.title = ':'.join([namespace_map[page.namespace], page.title])
else:
parser.add_argument('-u', '--url-encode', dest="urlencode", action="store_true",
                    help="Output url encoded text strings. This works around some data issues like newlines in editor names. In the future it may be used to output other text data.")

# Optional namespace filter. The value is kept as the raw comma-separated
# string on args.namespace_filter (argparse leaves it as None when the
# option is not given); any splitting into individual namespace numbers
# has to be done by the code that consumes it.
parser.add_argument('-ns', '--namespace-filter', dest="namespace_filter", type=str,
                    help="Comma-separated list of namespace numbers to include")

args = parser.parse_args()
# set persistence method