(Update package: OSW Core) |
Tag: Undo |
||
(14 intermediate revisions by 3 users not shown) | |||
Line 1: | Line 1: | ||
-- mw.logObject(p.processJsondata({jsondata=p.loadJson({title="Item:OSW7d7193567ea14e4e89b74de88983b718", slot="jsondata"}).json, debug=true, mode="header"})) | |||
local lustache = require("Module:Lustache") | local lustache = require("Module:Lustache") | ||
Line 5: | Line 7: | ||
p.keys = { --jsonschema / json-ld keys | p.keys = { --jsonschema / json-ld keys | ||
category='type', | category='type', | ||
category_pseudoproperty='Category', -- Property:Category | |||
subcategory='subclass_of', | subcategory='subclass_of', | ||
schema_type='schema_type', | schema_type='schema_type', | ||
Line 20: | Line 23: | ||
} | } | ||
p.slots = { --slot names | p.slots = { --slot names | ||
main='main', | |||
jsondata='jsondata', | jsondata='jsondata', | ||
jsonschema='jsonschema', | jsonschema='jsonschema', | ||
Line 31: | Line 35: | ||
query='query' | query='query' | ||
} | } | ||
p.cache = {} | |||
--loads json from a wiki page | --loads json from a wiki page | ||
Line 37: | Line 43: | ||
function p.loadJson(args) | function p.loadJson(args) | ||
local page_title = p.defaultArg(args.title, "JsonSchema:Entity") --for testing | local page_title = p.defaultArg(args.title, "JsonSchema:Entity") --for testing | ||
local slot = p.defaultArg(args.slot, | local slot = p.defaultArg(args.slot, 'main') | ||
local debug = p.defaultArg(args.debug, nil) | local debug = p.defaultArg(args.debug, nil) | ||
local msg = "" | local msg = "" | ||
Line 43: | Line 49: | ||
local json = {} | local json = {} | ||
if (slot == | if p.cache[page_title] ~= nil then | ||
if p.cache[page_title][slot] ~= nil then | |||
if (debug) then msg = msg .. "Fetch slot " .. p.slots.jsondata .. " of page " .. page_title .. " from cache <br>" end | |||
json = p.cache[page_title][slot] | |||
return {json=json, debug_msg=msg} | |||
end | |||
else p.cache[page_title] = {} | |||
end | |||
if (slot == 'main') then | |||
--json = mw.loadJsonData( "JsonSchema:Entity" ) --requires MediaWiki 1.39 | --json = mw.loadJsonData( "JsonSchema:Entity" ) --requires MediaWiki 1.39 | ||
local page = mw.title.makeTitle(p.splitString(page_title, ':')[1], p.splitString(page_title, ':')[2]) | local page = mw.title.makeTitle(p.splitString(page_title, ':')[1], p.splitString(page_title, ':')[2]) | ||
Line 49: | Line 64: | ||
if (text ~= nil) then json = mw.text.jsonDecode(text) end | if (text ~= nil) then json = mw.text.jsonDecode(text) end | ||
else | else | ||
if (debug) then msg = msg .. "Fetch slot " .. p.slots.jsondata .. " | if (debug) then msg = msg .. "Fetch slot " .. p.slots.jsondata .. " of page " .. page_title .. "<br>" end | ||
local text = mw.slots.slotContent( slot , page_title ) | local text = mw.slots.slotContent( slot , page_title ) | ||
if (text ~= nil) then json = mw.text.jsonDecode(text) end | if (text ~= nil) then json = mw.text.jsonDecode(text) end | ||
end | end | ||
local generated_content = json["$defs"] and json["$defs"]["generated"] | |||
if generated_content then | |||
-- Check if "$ref": "#/$defs/generated" exists directly in the table | |||
if json["$ref"] == "#/$defs/generated" then | |||
json = p.tableMerge(p.copy(generated_content), json) | |||
json["$ref"] = nil -- Remove the reference after merging | |||
end | |||
-- Check if "$ref": "#/$defs/generated" is contained in "allOf" | |||
if json["allOf"] then | |||
for _, item in ipairs(json["allOf"]) do | |||
if item["$ref"] == "#/$defs/generated" then | |||
-- Remove the reference after merging | |||
for i, v in ipairs(json["allOf"]) do | |||
if v["$ref"] == "#/$defs/generated" then | |||
table.remove(json["allOf"], i) | |||
break | |||
end | |||
end | |||
json = p.tableMerge(p.copy(generated_content), json) | |||
break | |||
end | |||
end | |||
end | |||
json["$defs"]["generated"] = nil | |||
end | |||
--[[local defs = p.defaultArgPath(json, {"$defs", "generated"}, nil) | |||
if defs == nil then defs = p.defaultArgPath(json, {"definitions", "generated"}, nil) end | |||
if defs ~= nil then | |||
json = p.tableMerge(p.copy(defs), json) | |||
json["allOf"] = p.tableMerge(json["allOf"], p.copy(defs["allOf"])) | |||
end]]-- | |||
--mw.logObject(json) | --mw.logObject(json) | ||
p.cache[page_title][slot] = json | |||
return {json=json, debug_msg=msg} | return {json=json, debug_msg=msg} | ||
end | end | ||
-- test: mw.logObject(p.walkJsonSchema({jsonschema=p.loadJson({title="Category:Hardware", slot="jsonschema"}).json, debug=true}).jsonschema) | -- test: mw.logObject(p.walkJsonSchema({jsonschema=p.loadJson({title="Category:Hardware", slot="jsonschema"}).json, debug=true}).jsonschema) | ||
Line 67: | Line 122: | ||
local mode = p.defaultArg(args.mode, p.mode.header) | local mode = p.defaultArg(args.mode, p.mode.header) | ||
--local merged_jsonschema = p.defaultArg(args.merged_jsonschema, {}) | --local merged_jsonschema = p.defaultArg(args.merged_jsonschema, {}) | ||
local template = p.defaultArg(args.template, nil) | |||
local templates = p.defaultArg(args.templates, {}) | local templates = p.defaultArg(args.templates, {}) | ||
local recursive = p.defaultArg(args.recursive, true) | local recursive = p.defaultArg(args.recursive, true) | ||
Line 78: | Line 134: | ||
if (mode == p.mode.header) then category_template_slot = p.slots.header_template end | if (mode == p.mode.header) then category_template_slot = p.slots.header_template end | ||
if (categories == nil) then categories = p.getCategories({jsonschema=jsonschema, includeNamespace=true}).categories end | if (categories == nil) then categories = p.getCategories({jsonschema=jsonschema, includeNamespace=true, includeSchemas=true}).categories end | ||
if (type(categories) ~= 'table') then categories = {categories} end | if (type(categories) ~= 'table') then categories = {categories} end | ||
if (debug) then msg = msg .. "Supercategories: " .. mw.dumpObject(categories) .. "\n<br>" end | if (debug) then msg = msg .. "Supercategories: " .. mw.dumpObject(categories) .. "\n<br>" end | ||
Line 85: | Line 141: | ||
--mw.logObject("Visit " .. category) | --mw.logObject("Visit " .. category) | ||
if (debug) then msg = msg .. "Fetch slot " .. p.slots.jsonschema .. " from page " .. category .. "\n<br>" end | if (debug) then msg = msg .. "Fetch slot " .. p.slots.jsonschema .. " from page " .. category .. "\n<br>" end | ||
local | local super_jsonschema = nil | ||
if ( | if p.splitString(category, ':')[1] == "JsonSchema" then super_jsonschema = p.loadJson({title=category, slot=p.slots.main}).json | ||
else super_jsonschema = p.loadJson({title=category, slot=p.slots.jsonschema}).json end | |||
mw.logObject("INSERT") | |||
mw.logObject(super_jsonschema) | |||
if (super_jsonschema ~= nil) then | |||
if (recursive) then | if (recursive) then | ||
local res = p.walkJsonSchema({jsonschema=super_jsonschema, jsonschemas=jsonschemas, templates=templates, mode=mode, visited=visited, root=false}) | local res = p.walkJsonSchema({jsonschema=super_jsonschema, jsonschemas=jsonschemas, templates=templates, mode=mode, visited=visited, root=false}) | ||
Line 96: | Line 155: | ||
--mw.logObject("Store " .. category) | --mw.logObject("Store " .. category) | ||
table.insert(visited, category) | table.insert(visited, category) | ||
jsonschemas[category] = | |||
jsonschemas[category] = p.copy( super_jsonschema ) --keep a copy of the schema, super_jsonschema passed by references gets modified | |||
--jsonschema = p.tableMerge(jsonschema, super_jsonschema) --merge superschema is done by the caller | --jsonschema = p.tableMerge(jsonschema, super_jsonschema) --merge superschema is done by the caller | ||
end | end | ||
Line 104: | Line 164: | ||
end | end | ||
end | end | ||
if (root and p.tableLength(jsonschema) > 0) then | |||
table.insert(visited, "_") -- dummy category for own schema | |||
jsonschemas["_"] = p.copy(jsonschema) | |||
templates["_"] = template | |||
end | |||
if (root) then | if (root) then | ||
for i, category in ipairs(visited) do | for i, category in ipairs(visited) do | ||
jsonschema = p.tableMerge(jsonschema, jsonschemas[category]) | --merge all schemas. we need to make a copy here, otherwise jsonschemas["Category:Entity"] contains the merged schema | ||
jsonschema = p.copy(p.tableMerge(jsonschema, jsonschemas[category])) | |||
end | end | ||
end | end | ||
Line 134: | Line 199: | ||
local msg = "" | local msg = "" | ||
local res = p.defaultArg(args.jsondata, "") | local res = p.defaultArg(args.jsondata, "") | ||
local root = p.defaultArg(args.root, true) -- first entry into recursion | |||
for k,v in pairs(jsondata) do | for k,v in pairs(jsondata) do | ||
Line 149: | Line 215: | ||
-- mustache can handle objects and array to we can parse it directly | -- mustache can handle objects and array to we can parse it directly | ||
-- todo: handle nested templates | -- todo: handle nested templates | ||
if (debug) then msg = msg .. "Parse mustache template " .. eval_template.value .. " with params " .. mw.dumpObject( | local template_param = {[k]=v} | ||
jsondata[k] = lustache:render(eval_template.value, { | if (eval_template.root_key == false) then template_param = v end | ||
if (debug) then msg = msg .. "Parse mustache template " .. eval_template.value .. " with params " .. mw.dumpObject( template_param ) .. "\n<br>" end | |||
jsondata[k] = lustache:render(eval_template.value, template_param, p.tableMerge({self=eval_template.value}, eval_template.partials)) -- render with self as registered partial for recursion | |||
if (eval_template.type == "mustache-wikitext") then | if (eval_template.type == "mustache-wikitext") then | ||
jsondata[k] = frame:preprocess( jsondata[k] ) | jsondata[k] = frame:preprocess( jsondata[k] ) | ||
end | end | ||
elseif type(v) == 'table' then | elseif type(v) == 'table' then | ||
if (v[1] == nil) then --key value array = object/dict | if (p.tableLength(v) > 0 and v[1] == nil) then --key value array = object/dict | ||
local sub_res = p.expandEmbeddedTemplates({frame=frame, jsondata=v, template=eval_template, mode=mode, stringify_arrays=stringify_arrays}) | local sub_res = p.expandEmbeddedTemplates({frame=frame, jsondata=v, jsonschema=p.defaultArgPath(jsonschema, {"properties", k}, {}), template=eval_template, mode=mode, stringify_arrays=stringify_arrays, root=false}) | ||
msg = msg .. sub_res.debug_msg | msg = msg .. sub_res.debug_msg | ||
jsondata[k] = sub_res.res | jsondata[k] = sub_res.res | ||
Line 163: | Line 231: | ||
local string_list = "" | local string_list = "" | ||
for i,e in pairs(v) do | for i,e in pairs(v) do | ||
local eval_template = nil | |||
local eval_templates = p.defaultArgPath(jsonschema, {"properties", k, "items", p.keys.template}, {}) | |||
if (eval_templates[1] == nil) then eval_templates = {eval_templates} end --ensure list of objects | |||
for i, t in pairs(eval_templates) do | |||
if (t[p.keys.mode] ~= nil and t[p.keys.mode] == mode) then eval_template = t --use only render templates in render mode and store templates in store mode | |||
elseif (t[p.keys.mode] == nil) then eval_template = t --default | |||
elseif (debug) then msg = msg .. "Ignore eval_template" .. mw.dumpObject( t ) .. "\n<br>" | |||
end | |||
end | |||
if type(e) == 'table' then | if type(e) == 'table' then | ||
local | local sub_res = p.expandEmbeddedTemplates({frame=frame, jsondata=e, jsonschema=p.defaultArgPath(jsonschema, {"properties", k, "items"}, {}), template=eval_template, mode=mode, stringify_arrays=stringify_arrays, root=false}) | ||
msg = msg .. sub_res.debug_msg | msg = msg .. sub_res.debug_msg | ||
if (type(sub_res.res) == 'table') then | if (type(sub_res.res) == 'table') then | ||
Line 182: | Line 253: | ||
end | end | ||
else | else | ||
if (eval_template ~= nil and eval_template.value ~= nil) then | |||
--evaluate single array item string as json {"self": "<value>", ".": "<value>"} => does not work since jsondata is an object | |||
--e = p.expandEmbeddedTemplates({frame=frame, jsondata={["self"]=e,["."]=e}, jsonschema=p.defaultArgPath(jsonschema, {"properties", k, "items"}, {}), template=eval_template, mode=mode, stringify_arrays=stringify_arrays, root=false}) | |||
if (eval_template.type == "mustache" or eval_template.type == "mustache-wikitext") then | |||
if (debug) then msg = msg .. "Parse mustache template " .. eval_template.value .. " with params " .. mw.dumpObject( e ) .. "\n<br>" end | |||
-- {{.}} in the template will be the value of e | |||
e = lustache:render(eval_template.value, e, p.tableMerge({self=eval_template.value}, eval_template.partials)) -- render with self as registered partial for recursion | |||
end | |||
if (eval_template.type == "mustache-wikitext") then --or eval_template.type == "wikitext") then | |||
if (debug) then msg = msg .. "Parse wikitext template " .. e .. " with params " .. mw.dumpObject( e ) .. "\n<br>" end | |||
e = frame:preprocess( e ) | |||
end | |||
v[i] = e -- update array | |||
end | |||
if (stringify_arrays) then string_list = string_list .. e .. ";" end | if (stringify_arrays) then string_list = string_list .. e .. ";" end | ||
end | end | ||
Line 191: | Line 279: | ||
if (template == nil) then | if (template == nil and root == false) then -- don't stringify root json objects | ||
local templates = jsondata[p.keys.template] | local templates = jsondata[p.keys.template] | ||
if (templates == nil) then templates = p.defaultArg(jsonschema[p.keys.template], {}) end | if (templates == nil) then templates = p.defaultArg(jsonschema[p.keys.template], {}) end | ||
Line 203: | Line 291: | ||
end | end | ||
if template ~= nil then | if (template ~= nil and root == false) then -- don't stringify root json objects | ||
if (template.type == "wikitext") then | if (template.type == "wikitext") then | ||
for k,v in pairs(jsondata) do | for k,v in pairs(jsondata) do | ||
Line 248: | Line 336: | ||
--jsonschema = p.defaultArg(jsonschema, {}) | --jsonschema = p.defaultArg(jsonschema, {}) | ||
--jsondata = p.defaultArg(jsondata, {}) | --jsondata = p.defaultArg(jsondata, {}) | ||
if (categories == nil) then categories = jsondata[p.keys.category] end | --if (categories == nil) then categories = jsondata[p.keys.category] end -- let function param overwrite json property | ||
if (not p.nilOrEmpty(jsondata[p.keys.category])) then categories = jsondata[p.keys.category] end -- let json property overwrite function param | |||
local schema_res = p.walkJsonSchema({jsonschema=jsonschema, categories=categories, mode=mode, recursive=recursive, debug=debug}) | local schema_res = p.walkJsonSchema({jsonschema=jsonschema, template=template, categories=categories, mode=mode, recursive=recursive, debug=debug}) | ||
local expand_res = p.expandJsonRef({json=schema_res.jsonschema, debug=debug}) | |||
jsonschema = expand_res.json | |||
--mw.log(mw.text.jsonEncode(jsonschema)) | |||
local | |||
local jsonld = p.copy(jsondata) | local jsonld = p.copy(jsondata) | ||
Line 262: | Line 349: | ||
json_res_store = p.expandEmbeddedTemplates({jsonschema=jsonschema, jsondata=json_data_store, mode='store'}) | json_res_store = p.expandEmbeddedTemplates({jsonschema=jsonschema, jsondata=json_data_store, mode='store'}) | ||
msg = msg .. json_res_store.debug_msg | msg = msg .. json_res_store.debug_msg | ||
mw.log("JSONDATA STORE") | |||
mw.logObject(json_res_store.res) | |||
local smw_res = nil | local smw_res = nil | ||
if (mode == p.mode.header) then | if (mode == p.mode.header) then | ||
-- get the semantic properties by looking up the json keys in the json-ld context | |||
smw_res = p.getSemanticProperties({jsonschema=jsonschema, jsondata=json_res_store.res, store=false, debug=debug}) | smw_res = p.getSemanticProperties({jsonschema=jsonschema, jsondata=json_res_store.res, store=false, debug=debug}) | ||
-- store metadata where properties were defined / overridden | |||
for i, category in ipairs(schema_res.visited) do | |||
for k, v in pairs(p.defaultArgPath(schema_res.jsonschemas, {category, 'properties'}, {})) do --property section may not exisit | |||
if smw_res.definitions[k] == nil then smw_res.definitions[k] = {} end | |||
if smw_res.definitions[k]['defined_in'] == nil then smw_res.definitions[k]['defined_in'] = {} end | |||
table.insert(smw_res.definitions[k]['defined_in'], category) | |||
end | |||
end | |||
-- embed json-ld in resulting html for search engine discovery | |||
jsonld["@context"] = smw_res.context | jsonld["@context"] = smw_res.context | ||
jsonld["@type"] = p.tableMerge(p.tablefy(jsonschema.schema_type), p.tablefy(jsonld["@type"])) -- | jsonld["@type"] = p.tableMerge(p.tablefy(jsonschema.schema_type), p.tablefy(jsonld["@type"])) -- | ||
Line 275: | Line 375: | ||
if (type(v) == "string") then | if (type(v) == "string") then | ||
local vpart = p.splitString(v, ':') | local vpart = p.splitString(v, ':') | ||
if (vpart[1] == "File") then jsonld[k] = mw.getCurrentFrame():callParserFunction( 'filepath', { vpart[2] } ) end --google does not follow redirects via "File":"wiki:Special:Redirect/file/" | if (p.tableLength(vpart) == 2 and vpart[1] == "File") then jsonld[k] = mw.getCurrentFrame():callParserFunction( 'filepath', { vpart[2] } ) end --google does not follow redirects via "File":"wiki:Special:Redirect/file/" | ||
end | end | ||
end | end | ||
wikitext = wikitext .. "<div class='jsonld-header' style='display:none' data-jsonld='" .. mw.text.jsonEncode( jsonld ) .. "'></div>" | -- wikitext = wikitext .. "<div class='jsonld-header' style='display:none' data-jsonld='" .. mw.text.jsonEncode( jsonld ):gsub("'","`") .. "'></div>" | ||
end | end | ||
Line 286: | Line 386: | ||
--mw.log("JSONDATA RENDER") | --mw.log("JSONDATA RENDER") | ||
--mw.logObject(jsondata) | --mw.logObject(jsondata) | ||
local max_index = p.tableLength(schema_res.visited) | |||
for i, category in ipairs(schema_res.visited) do | for i, category in ipairs(schema_res.visited) do | ||
local | if (mode == p.mode.footer) then category = schema_res.visited[max_index - i +1] end --reverse order for footer templates | ||
local super_jsonschema = schema_res.jsonschemas[category] | |||
local template = schema_res.templates[category] | local template = schema_res.templates[category] | ||
if (template ~= nil) then | if (template ~= nil) then | ||
Line 298: | Line 399: | ||
end | end | ||
local child = frame:newChild{args=stripped_jsondata} | local child = frame:newChild{args=stripped_jsondata} | ||
if ( template:sub(1, #"=") == "=" ) then template = "\n" .. template end -- add line break if template starts with heading (otherwise not rendered by mw parser) | |||
wikitext = wikitext .. child:preprocess( template ) | wikitext = wikitext .. child:preprocess( template ) | ||
elseif (mode == p.mode.header) then | elseif (mode == p.mode.header) then | ||
local infobox_res = p.renderInfoBox({jsonschema=jsonschema, jsondata=jsondata}) | local ignore_properties = {[p.keys.category]=true} -- don't render type/category on every subclass | ||
for j, subcategory in ipairs(schema_res.visited) do | |||
if j > i then | |||
local subjsonschema = schema_res.jsonschemas[subcategory] | |||
for k, v in pairs(subjsonschema['properties']) do | |||
-- skip properties that are overwritten in subschemas, render them only once at the most specific position | |||
ignore_properties[k] = true | |||
end | |||
end | |||
end | |||
-- render the infobox for the schema itself and every super_schema using always the global json-ld context (merged within walkJsonSchema()) | |||
-- context needs to be preprocessed with buildContext() since the generic json/table merge of the @context atttribute produces a list of strings (remote context) and context objects | |||
-- context is already build in p.getSemanticProperties. schema_allOfMerged is used to provide the full schema for overridden properties | |||
local infobox_res = p.renderInfoBox({jsonschema=super_jsonschema, schema_allOfMerged=jsonschema, context=smw_res.context, property_definitions=smw_res.definitions, jsondata=jsondata, ignore_properties=ignore_properties}) | |||
wikitext = wikitext .. frame:preprocess( infobox_res.wikitext ) | wikitext = wikitext .. frame:preprocess( infobox_res.wikitext ) | ||
end | end | ||
end | end | ||
local set_categories_in_wikitext = {} | |||
p.tableMerge(set_categories_in_wikitext, json_res_store.res[p.keys.subcategory]) --classes/categories, nil for items | |||
if (title.nsText ~= "Category") then | if (title.nsText ~= "Category") then --items | ||
p.tableMerge(set_categories_in_wikitext, json_res_store.res[p.keys.category]) -- categories from schema type | |||
end | |||
-- Todo: Consider moving the category and this block to p.getSemanticProperties with store=true. However, settings categories with @category is only possible for subobjects | |||
if (smw_res ~= nil) then | if (smw_res ~= nil) then | ||
local display_label = p.getDisplayLabel(jsondata, smw_res.properties) | |||
if title.nsText == "Property" then display_label = p.defaultArgPath(jsondata, {p.keys.name}, display_label) end | |||
if (debug) then msg = msg .. "Store page properties" end | if (debug) then msg = msg .. "Store page properties" end | ||
smw_res.properties['Display title of'] = display_label --set special property display title | -- category handling | ||
p.tableMerge(set_categories_in_wikitext, smw_res.properties[p.keys.category_pseudoproperty]) | |||
smw_res.properties[p.keys.category_pseudoproperty] = nil -- delete pseudo property | |||
smw_res.properties['HasOswId'] = mw.title.getCurrentTitle().fullText --set special property OswId to own title | |||
-- label and display title handling | |||
if display_label ~= nil then | |||
smw_res.properties['Display title of'] = display_label --set special property display title | |||
smw_res.properties['Display title of lowercase'] = display_label:lower() --store lowercase for case insensitive query | |||
smw_res.properties['Display title of normalized'] = display_label:lower():gsub('[^%w]+','') --store with all non-alphanumeric chars removed for normalized query | |||
end | |||
p.setNormalizedLabel(smw_res.properties) --build normalized multilang label | |||
mw.ext.displaytitle.set(display_label) | mw.ext.displaytitle.set(display_label) | ||
--smw_res.properties['@category'] = jsondata[p.keys.category] | --smw_res.properties['@category'] = jsondata[p.keys.category] | ||
Line 325: | Line 459: | ||
--wikitext = mw.dumpObject(smw_res.properties) .. wikitext | --wikitext = mw.dumpObject(smw_res.properties) .. wikitext | ||
end | end | ||
wikitext = wikitext .. "\n" .. p.setCategories({categories=set_categories_in_wikitext, sortkey=display_label}).wikitext | |||
if (debug) then mw.logObject(res) end | if (debug) then mw.logObject(res) end | ||
Line 334: | Line 469: | ||
-- test: mw.logObject(p.renderInfoBox({jsonschema=p.loadJson({title="JsonSchema:Entity"}).json, jsondata={uuid="123123"}})) | -- test: mw.logObject(p.renderInfoBox({jsonschema=p.loadJson({title="JsonSchema:Entity"}).json, jsondata={uuid="123123"}})) | ||
function p.renderInfoBox(args) | function p.renderInfoBox(args) | ||
local debug = p.defaultArg(args.debug, false) | |||
local jsondata = p.defaultArg(args.jsondata, {}) | local jsondata = p.defaultArg(args.jsondata, {}) | ||
local schema = p.defaultArg(args.jsonschema, nil) | local schema = p.defaultArg(args.jsonschema, nil) -- local schema from the perspective of the current category | ||
local | local schema_allOfMerged = p.defaultArg(args.schema_allOfMerged, schema) -- global schema with allOfs merged | ||
local property_definitions = p.defaultArg(args.property_definitions, {}) -- dict schema_key: {property: <smw_property>, ...} | |||
local res = "" | local res = "" | ||
if schema == nil then return res end | if schema == nil then return res end | ||
local context = p.defaultArg(args.context, p.buildContext({jsonschema=schema}).context) | |||
local ignore_properties = p.defaultArg(args.ignore_properties, {}) | |||
local schema_label = "" | local schema_label = "" | ||
if schema['title'] ~= nil then schema_label = schema['title'] end | if schema['title'] ~= nil then schema_label = schema['title'] end | ||
Line 347: | Line 488: | ||
:attr( 'class', 'info_box' ) | :attr( 'class', 'info_box' ) | ||
:tag( 'tr' ) | :tag( 'tr' ) | ||
:tag( ' | :tag( 'th' ) | ||
:attr( 'class', ' | :attr( 'class', 'heading' ) | ||
:attr( 'colspan', '2' ) | :attr( 'colspan', '2' ) | ||
:wikitext( schema_label ) | :wikitext( schema_label ) | ||
for k,v in pairs(jsondata) do | for k,v in pairs(jsondata) do | ||
if (schema['properties'] ~= nil and schema['properties'][k] ~= nil and (type(v) ~= 'table' or v[1] ~= nil)) then --literal or literal array | if (not ignore_properties[k]) then | ||
if (schema['properties'] ~= nil and schema['properties'][k] ~= nil and (type(v) ~= 'table' or v[1] ~= nil)) then --literal or literal array | |||
local def = schema_allOfMerged['properties'][k] | |||
--mw.logObject(def) | |||
local label = k | |||
if def['title'] ~= nil then label = def['title'] end | |||
if def['title*'] ~= nil then -- multilang label with switch | |||
label = "{{#switch:{{USERLANGUAGECODE}} |#default=" .. label | |||
for k,v in pairs(def['title*']) do label = label .. " |" .. k .. "=" .. v end | |||
label = label .. " }}" | |||
end | |||
local description = "" | |||
if def['description'] ~= nil then description = def['description'] end | |||
if def['description*'] ~= nil then -- multilang label with switch | |||
description = "{{#switch:{{USERLANGUAGECODE}} |#default=" .. description | |||
for k,v in pairs(def['description*']) do description = description .. " |" .. k .. "=" .. v end | |||
description = description .. " }}" | |||
end | |||
if (p.tableLength(p.defaultArgPath(property_definitions, {k, 'defined_in'}, {})) > 0) then description = description .. "<br>Definition: " end | |||
for i, c in pairs(p.defaultArgPath(property_definitions, {k, 'defined_in'}, {})) do | |||
if (i > 1) then description = description .. ", " end | |||
description = description .. "[[:" ..c .. "]]" | |||
end | |||
if (description ~= "") then description = "{{#info: " .. description .. "|note }}" end -- smw tooltip | |||
label = label .. description | |||
--res = res .. title ": " .. v | |||
local cell = tbl:tag( 'tr' ) | |||
:tag( 'th' ) | |||
:wikitext( label ) | |||
:done() | |||
:tag( 'td' ) | |||
if (type(v) == 'table') then | |||
for i,e in pairs(v) do | |||
if (type(e) ~= 'table') then | |||
local p_type = p.defaultArgPath(context, {k, '@type'}, '@value') | |||
if (p_type == '@id' and p.defaultArgPath(def, {'items', 'type'}, 'unknown') == 'string' and def['eval_template'] == nil) then | |||
-- auto-link (OSW-)IDs if no eval_template is present | |||
e = string.gsub(e, "Category:", ":Category:") -- make sure category links work | |||
e = string.gsub(e, "File:", ":File:") -- do not embedd images but link to them | |||
e = "[[" .. e .. "]]" | |||
elseif (p_type == 'xsd:date') then -- formate date with user preferences | |||
e = "{{#dateformat:" .. e .. "|ymd}}" | |||
elseif (p_type == 'xsd:dateTime') then -- formate time with user preferences | |||
local smw_property = p.defaultArgPath(property_definitions, {k, 'property'}) | |||
if (smw_property ~= nil) then e = "{{#ask: [[{{FULLPAGENAME}}]]|?" .. smw_property .. "#LOCL#TO= |format=plain |mainlabel=-}}" | |||
else | |||
local _, _, date, hours, minutes = string.find(e, "(%S+)[T ](%S+)[:](%S+)[:?]") | |||
e = "{{#dateformat:" .. date .. "|ymd}} " .. hours .. ":" .. minutes .. " (UTC)" | |||
end | |||
elseif (type(v) == 'boolean') then | |||
if (v) then v = "✅" else v = "❌" end -- green check mark or red cross | |||
elseif ((string.len(e) > 100) and (string.find(e, "{{") == nil) and (string.find(e, "</") == nil) and (string.find(e, "%[%[") == nil)) then -- no markup, no links | |||
e = string.sub(e, 1, 100) .. "..."; -- limit infobox plain text to max 100 chars | |||
elseif (debug) then | |||
mw.log("Unformated: " .. k .. " " .. p.defaultArgPath(def, {'items', 'type'}, 'unknown')) | |||
mw.logObject(def) | |||
end | |||
cell:wikitext("\n* " .. e .. "") | |||
end | |||
end | |||
else | |||
local p_type = p.defaultArgPath(context, {k, '@type'}, '@value') | |||
if (p_type == '@id' and p.defaultArgPath(def, {'type'}, 'unknown') == 'string' and def['eval_template'] == nil) then | |||
-- auto-link (OSW-)IDs if no eval_template is present | |||
v = string.gsub(v, "Category:", ":Category:") -- make sure category links work | |||
v = string.gsub(v, "File:", ":File:") -- do not embedd images but link to them | |||
v = "[[" .. v .. "]]" | |||
elseif (p_type == 'xsd:date') then -- formate date & time with user preferences | |||
v = "{{#dateformat:" .. v .. "|ymd}}" | |||
elseif (p_type == 'xsd:dateTime') then -- formate time with user preferences | |||
local smw_property = p.defaultArgPath(property_definitions, {k, 'property'}) | |||
if (smw_property ~= nil) then v = "{{#ask: [[{{FULLPAGENAME}}]]|?" .. smw_property .. "#LOCL#TO= |format=plain |mainlabel=-}}" | |||
else | |||
local _, _, date, hours, minutes = string.find(v, "(%S+)[T ](%S+)[:](%S+)[:?]") | |||
v = "{{#dateformat:" .. date .. "|ymd}} " .. hours .. ":" .. minutes .. " (UTC)" | |||
end | |||
elseif (type(v) == 'boolean') then | |||
if (v) then v = "✅" else v = "❌" end -- green check mark or red cross | |||
elseif ((string.len(v) > 100) and (string.find(v, "{{") == nil) and (string.find(v, "</") == nil) and (string.find(v, "%[%[") == nil)) then -- no markup, no links | |||
v = string.sub(v, 1, 100) .. "..."; -- limit infobox plain text to max 100 chars | |||
elseif (debug) then | |||
mw.log("Unformated: " .. k .. " " .. p.defaultArgPath(def, {'type'}, 'unknown')) | |||
mw.logObject(def) | |||
end | end | ||
cell:wikitext("\n" .. v .. "") | |||
end | end | ||
end | end | ||
end | end | ||
Line 390: | Line 597: | ||
local jsonschema = p.defaultArg(args.jsonschema, {}) | local jsonschema = p.defaultArg(args.jsonschema, {}) | ||
local includeNamespace = p.defaultArg(args.includeNamespace, false) | local includeNamespace = p.defaultArg(args.includeNamespace, false) | ||
local includeSchemas = p.defaultArg(args.includeSchemas, false) | |||
local categories = {} | local categories = {} | ||
Line 396: | Line 604: | ||
--properties['@category'] = {} | --properties['@category'] = {} | ||
for k, entry in pairs(allOf) do | for k, entry in pairs(allOf) do | ||
if type(entry) == 'table' then -- "allOf": [{"$ref": "/wiki/Category:Test?action=raw"}] | local refs = nil | ||
if type(entry) == 'table' then refs = entry -- "allOf": [{"$ref": "/wiki/Category:Test?action=raw"}] | |||
else refs = {entry} end-- "allOf": {"$ref": "/wiki/Category:Test?action=raw"} | |||
for p, v in pairs(entry) do | |||
if (p == '$ref') then | |||
table.insert(categories, | for category in v:gmatch("Category:([^?]+)") do -- e.g. "/wiki/Category:Test?action=raw" | ||
if (includeNamespace) then category = "Category:" .. category end | |||
table.insert(categories, category) | |||
end | |||
if includeSchemas then | |||
for schema in v:gmatch("JsonSchema:([^?]+)") do -- e.g. "/wiki/JsonSchema:Test?action=raw" | |||
if (includeNamespace) then schema = "JsonSchema:" .. schema end | |||
table.insert(categories, schema) | |||
end | end | ||
end | end | ||
end | end | ||
end | end | ||
end | end | ||
Line 434: | Line 642: | ||
--[[ test | --[[ test | ||
category = "Category: | category = "Category:Entity" | ||
jsonschema = p.expandJsonRef({json=p.loadJson({title=category, slot="jsonschema"}).json}).json | |||
jsonschema =p. | mw.logObject(p.buildContext({jsonschema=jsonschema, debug=true})) | ||
mw.log(mw.text.jsonEncode(p.buildContext({jsonschema=jsonschema, debug=false}).context)) | |||
or | |||
jsonschema = { | |||
["@context"]={test="level 0"}, | |||
properties={ | |||
test={ | |||
type="object", | |||
["@context"]={test1="level 1"}, | |||
properties= { | |||
test= { | |||
type="array", | |||
items= { | |||
type="object", | |||
["@context"]={test2="level 2"} | |||
} | |||
} | |||
} | |||
} | |||
} | |||
} | |||
mw.logObject(p.buildContext({jsonschema=jsonschema, debug=true})) | mw.logObject(p.buildContext({jsonschema=jsonschema, debug=true})) | ||
--]] | --]] | ||
-- constructs a property specific local jsonld context | |||
function p.buildContext(args) | function p.buildContext(args) | ||
local schema = p.defaultArg(args.jsonschema, {}) | local schema = p.defaultArg(args.jsonschema, {}) | ||
--mw.logObject(schema) | |||
local context = p.defaultArg(args.context, schema[p.keys.context]) | local context = p.defaultArg(args.context, schema[p.keys.context]) | ||
local result = {} | local result = p.defaultArg(args.result, {}) | ||
if (context ~= nil) then | if (context ~= nil) then | ||
for k,v in pairs(context) do | for k,v in pairs(context) do | ||
Line 449: | Line 680: | ||
elseif (type(v) == 'table' and v[1] ~= nil) then --custom addtional mappings, e. g. "type*": ["Property:HasType"] | elseif (type(v) == 'table' and v[1] ~= nil) then --custom addtional mappings, e. g. "type*": ["Property:HasType"] | ||
result[k] = v | result[k] = v | ||
elseif (type(v) == 'table' and v['@id'] == nil) then --subcontext | elseif (type(v) == 'table' and v['@id'] == nil and v['@reverse'] == nil) then --subcontext | ||
p.tableMerge(result, p.buildContext({context=v}).context) | p.tableMerge(result, p.buildContext({context=v}).context) | ||
else | else | ||
result[k] = v | result[k] = v | ||
end | end | ||
end | |||
end | |||
local properties = p.defaultArg(schema.properties, {}) | |||
-- build property context | |||
for k,v in pairs(properties) do | |||
local subcontext = nil | |||
if (p.defaultArgPath(properties, {k, 'type'}) == 'object') then | |||
--mw.logObject(properties[k]) | |||
subcontext = p.buildContext({jsonschema=properties[k]}).context | |||
elseif (p.defaultArgPath(properties, {k, 'items', 'type'}) == 'object') then | |||
--mw.logObject(properties[k]['items']) | |||
subcontext = p.buildContext({jsonschema=properties[k]['items']}).context | |||
end | |||
if (subcontext ~= nil and p.tableLength(subcontext) > 0) then | |||
if (result[k] == nil) then result[k] = {} end | |||
if (type(result[k]) == 'string') then result[k] = {["@id"]=result[k]} end | |||
if (result[k][p.keys.context] == nil) then result[k][p.keys.context] = {} end | |||
result[k][p.keys.context] = p.tableMerge(result[k][p.keys.context], subcontext) | |||
end | end | ||
end | end | ||
Line 460: | Line 710: | ||
--maps jsondata values to semantic properties by using the @context attribute within the schema | --maps jsondata values to semantic properties by using the @context attribute within the schema | ||
--test: mw.logObject(p.getSemanticProperties({jsonschema={["@context"]={test="Property:TestProperty", myObjectProperty={["@id"]= "Property:MyObjectProperty", ["@type"]= "@id"}}}, jsondata={test="TestValue", myObjectProperty="123"}, debug=true})) | --test: mw.logObject(p.getSemanticProperties({jsonschema={["@context"]={test="Property:schema:TestProperty", myObjectProperty={["@id"]= "Property:MyObjectProperty", ["@type"]= "@id"}}}, jsondata={test="TestValue", myObjectProperty="123"}, debug=true})) | ||
--test: mw.logObject(p.getSemanticProperties({jsonschema={["@context"]={"some uri",{test="Property:TestProperty", myObjectProperty={["@id"]= "Property:MyObjectProperty", ["@type"]= "@id"}}}}, jsondata={test="TestValue", myObjectProperty="123"}, debug=true})) | --test: mw.logObject(p.getSemanticProperties({jsonschema={["@context"]={"some uri",{test="Property:TestProperty", myObjectProperty={["@id"]= "Property:MyObjectProperty", ["@type"]= "@id"}}}}, jsondata={test="TestValue", myObjectProperty="123"}, debug=true})) | ||
--[[ | --[[ | ||
Line 485: | Line 735: | ||
local schema = p.defaultArg(args.jsonschema, {}) | local schema = p.defaultArg(args.jsonschema, {}) | ||
local subschema = p.defaultArg(args.subschema, schema) | local subschema = p.defaultArg(args.subschema, schema) | ||
local parent_schema_property = p.defaultArg(args.parent_schema_property, {}) | local parent_schema_property = p.defaultArg(args.parent_schema_property, {}) -- ToDo: Not used except in getSemanticQuery => remove | ||
local store = p.defaultArg(args.store, false) | local store = p.defaultArg(args.store, false) | ||
local root = p.defaultArg(args.root, true) | local root = p.defaultArg(args.root, true) | ||
local properties = p.defaultArg(args.properties, {}) --semantic properties to store, dict key=property_name, value=array of string values | |||
local debug = p.defaultArg(args.debug, false) | local debug = p.defaultArg(args.debug, false) | ||
--if (debug) then mw.logObject("Call getSemanticProperties with args " .. mw.dumpObject( args ) .. "\n<br>") end | --if (debug) then mw.logObject("Call getSemanticProperties with args " .. mw.dumpObject( args ) .. "\n<br>") end | ||
local | local subjectId = mw.title.getCurrentTitle().fullText | ||
local subobjectId = nil | |||
if (root == false and jsondata['uuid'] ~= nil) then | |||
subobjectId = "OSW" .. string.gsub(jsondata['uuid'], "-", "") | |||
subjectId = subjectId .. '#' .. subobjectId | |||
end | |||
local property_data = {} | local property_data = {} | ||
local context = p.defaultArg(args.context, p.buildContext({jsonschema=schema}).context) | local context = p.defaultArg(args.context, p.buildContext({jsonschema=schema}).context) | ||
local error = "" | local error = "" | ||
if (debug) then mw.logObject(context) end | if (debug) then mw.logObject(context) end | ||
Line 507: | Line 764: | ||
for k,v in pairs(jsondata) do | for k,v in pairs(jsondata) do | ||
local property_names = {} | local property_names = {} | ||
local subobject_properties = {} -- reverse properties to store in the subobject | |||
local mapping_found = false | local mapping_found = false | ||
local property_definitions = {} | local property_definitions = {} -- list of objects {id=..., reverse=...} | ||
for term, def in pairs(context) do | for term, def in pairs(context) do | ||
local term_parts = p.splitString(term, "*") | local term_parts = p.splitString(term, "*") | ||
if ( | if (term_parts[1] == k) then --custom additional mapping term*(*...): "Property:..." | ||
table.insert(property_definitions, def) | if type(def) == 'table' then | ||
-- note: json-ld allows only @id OR @reverse | |||
if (def["@id"] ~= nil) then table.insert(property_definitions, {id=def["@id"], reverse=false}) end | |||
if (def["@reverse"] ~= nil) then table.insert(property_definitions, {id=def["@reverse"], reverse=true}) end | |||
else table.insert(property_definitions, {id=def}) end | |||
end | end | ||
end | end | ||
if (debug) then mw.logObject(property_definitions) end | if (debug) then mw.logObject(property_definitions) end | ||
for i,e in ipairs(property_definitions) do | for i,e in ipairs(property_definitions) do | ||
local property_definition = p.splitString( | local id = e["id"] | ||
local property_definition = p.splitString(id, ':') | |||
if property_definition[1] == p.keys.property_ns_prefix then | if property_definition[1] == p.keys.property_ns_prefix then | ||
mapping_found = true | mapping_found = true | ||
table.insert(property_names, | property_name = string.gsub(id, p.keys.property_ns_prefix .. ":", "") -- also allow prefix properties like: Property:schema:url | ||
if (e["reverse"]) then -- reverse properties are handled in the respective subobject | |||
if (subobject_properties[property_name] == nil) then subobject_properties[property_name] = {} end --initialize empty list | |||
table.insert(subobject_properties[property_name], subjectId) -- add triple subobject -property-> subject | |||
else table.insert(property_names, property_name) end | |||
local schema_property = p.defaultArg(schema_properties[k], {}) | local schema_property = p.defaultArg(schema_properties[k], {}) | ||
local schema_type = p.defaultArg(schema_property.type, nil) --todo: also load smw property type on demand | local schema_type = p.defaultArg(schema_property.type, nil) --todo: also load smw property type on demand | ||
property_data[k] = {schema_type=schema_type, schema_data=schema_property, property= | property_data[k] = {schema_type=schema_type, schema_data=schema_property, property=property_name, value=v, reverse=e["reverse"]} | ||
end | end | ||
end | end | ||
Line 536: | Line 800: | ||
--if (debug) then mw.logObject("prop " .. k .. " = " .. mw.dumpObject(v)) end | --if (debug) then mw.logObject("prop " .. k .. " = " .. mw.dumpObject(v)) end | ||
if (mapping_found) then | if (mapping_found) then | ||
local subcontext = p.copy(p.defaultArgPath(context, {k, p.keys.context}, {})) --deepcopy, see also https://phabricator.wikimedia.org/T269990 | |||
context = p.tableMerge(context, subcontext) -- pull up nested context | |||
local values = {} | local values = {} | ||
if (v[1] == nil) then --key value array = object/dict | if (p.tableLength(v) > 0 and v[1] == nil) then --key value array = object/dict => subobject | ||
local | local subproperties_res = p.getSemanticProperties({jsonschema=schema, jsondata=v, properties=p.copy(subobject_properties), store=true, root=false, debug=debug, context=context, subschema=schema_properties[k], parent_schema_property=property_data[k]}) | ||
local id = subproperties_res.id --subobject_id | |||
if (id ~= nil) then | if (id ~= nil) then | ||
id = mw.title.getCurrentTitle().fullText .. '#' .. id | id = mw.title.getCurrentTitle().fullText .. '#' .. id | ||
table.insert(values, id) | table.insert(values, id) | ||
end | end | ||
properties = p.processStatement({subject=properties, statement=subproperties_res.properties, debug=debug}).subject | |||
else --list array | else --list array | ||
for i, e in pairs(v) do | for i, e in pairs(v) do | ||
if (type(e) == 'table') then | if (type(e) == 'table') then | ||
local | local subproperties_res = p.getSemanticProperties({jsonschema=schema, jsondata=e, properties=p.copy(subobject_properties), store=true, root=false, debug=debug, context=context, subschema=schema_properties[k], parent_schema_property=property_data[k]}) | ||
local id = subproperties_res.id --subobject_id | |||
if (id ~= nil) then | if (id ~= nil) then | ||
id = mw.title.getCurrentTitle().fullText .. '#' .. id | id = mw.title.getCurrentTitle().fullText .. '#' .. id | ||
table.insert(values, id) | table.insert(values, id) | ||
end | end | ||
properties = p.processStatement({subject=properties, statement=subproperties_res.properties, debug=debug}).subject | |||
else values = v end --plain strings | else values = v end --plain strings | ||
end | end | ||
Line 574: | Line 843: | ||
end | end | ||
local store_res = nil | local store_res = nil | ||
if (store) then | if (store) then | ||
properties['HasOswId'] = subjectId | |||
if (root) then | if (root) then | ||
if (debug) then mw.logObject("Store page properties") end | if (debug) then mw.logObject("Store page properties") end | ||
store_res = mw.smw.set( properties ) --store as semantic properties | store_res = mw.smw.set( properties ) --store as semantic properties | ||
else | else | ||
properties['@category'] = {} | |||
p.tableMerge(properties['@category'], jsondata[p.keys.category]) -- from json property 'type' | |||
p.tableMerge(properties['@category'], properties[p.keys.category_pseudoproperty]) -- from json-ld context 'Property:Category' | |||
properties[p.keys.category_pseudoproperty] = nil -- delete pseudo property | |||
local display_label = p.getDisplayLabel(jsondata, properties) | |||
properties[' | if properties['Display title of'] == nil and properties['Display_title_of'] == nil then | ||
if (display_label ~= nil and display_label ~= "") then properties['Display title of'] = display_label | |||
else properties['Display title of'] = p.defaultArg(subschema['title'], "") end -- fall back to property name in schema | |||
end | |||
p.setNormalizedLabel(properties) --build normalized multilang label | |||
if (p.tableLength(properties) > 0) then | if (p.tableLength(properties) > 0) then | ||
store_res = mw.smw.subobject( properties, subobjectId ) --store as subobject | store_res = mw.smw.subobject( properties, subobjectId ) --store as subobject | ||
if (debug) then mw.logObject("Store subobject with id " .. subobjectId) end | if (debug) then mw.logObject("Store subobject with id " .. (subobjectId or "<random>")) end | ||
end | end | ||
end | end | ||
Line 599: | Line 873: | ||
if (debug) then mw.logObject(error) end | if (debug) then mw.logObject(error) end | ||
return {properties=properties, definitions=property_data, id=subobjectId, context=context, error=error} | return {properties=properties, definitions=property_data, id=subobjectId, context=context, error=error} | ||
end | |||
function p.processStatement(args) | |||
local statement = p.defaultArg(args.statement) | |||
local subject = p.defaultArg(args.subject) | |||
local debug = p.defaultArg(args.debug, false) | |||
-- handle "approved" statements | |||
if (statement["HasSubject"] == nil or statement["HasSubject"][1] == nil or statement["HasSubject"][1] == "") then --implicit subject | |||
if (statement["HasProperty"] ~= nil and statement["HasProperty"][1] ~= nil and statement["HasProperty"][1] ~= "" and statement["HasObject"] ~= nil) then | |||
local property = string.gsub(statement["HasProperty"][1], p.keys.property_ns_prefix .. ":", "") -- also allow prefix properties like: Property:schema:url | |||
if (debug) then | |||
mw.log("Set property " .. property .. " from statement to ") | |||
mw.logObject(statement["HasObject"]) | |||
end | |||
if (subject[property] == nil) then subject[property] = {} end | |||
for k, v in pairs(statement["HasObject"]) do table.insert(subject[property], v) end | |||
end | |||
end | |||
return {subject=subject} | |||
end | end | ||
Line 647: | Line 941: | ||
-- HELPERS | -- HELPERS | ||
-- expands all $ref | |||
--test: mw.logObject(p.expandJsonRef({json={items={test="value", ["$ref"]="/wiki/JsonSchema:Label?action=raw"}}}).json) | |||
--test: mw.logObject(p.expandJsonRef({json={["$ref"]="/wiki/Category:Item?action=raw&slot=jsonschema"}}).json) | |||
--test: mw.logObject(p.expandJsonRef({json={["$ref"]="/wiki/JsonSchema:Statement?action=raw"}}).json) | |||
function p.expandJsonRef(args) | |||
local json = p.defaultArg(args.json, {}) | |||
local debug = p.defaultArg(args.debug, false) | |||
local refs = {} | |||
for k,v in pairs(json) do | |||
if (k == "$ref") then | |||
-- e. g. "/wiki/JsonSchema:Label?action=raw" or "/wiki/Category:Entity?action=raw&slot=jsonschema" | |||
if string.find(v, "#") then | |||
if (debug) then mw.logObject("Skip relative reference") end | |||
else | |||
local uri = mw.uri.new(v) | |||
local ref_title = mw.text.split(uri.path, "wiki/", true)[2] | |||
local ref_slot = uri.query["slot"] | |||
if (debug) then | |||
if (ref_slot ~= nil) then mw.logObject("Ref found with title " .. ref_title .. " and slot " .. ref_slot) | |||
else mw.logObject("Ref found with title " .. ref_title) end | |||
end | |||
local ref_json = p.loadJson({title=ref_title, slot=ref_slot}).json | |||
refs[v] = ref_json | |||
json[k] = nil | |||
end | |||
end | |||
end | |||
--mw.logObject(refs) | |||
for k,v in pairs(refs) do | |||
json = p.tableMerge(v, json) | |||
end | |||
for k,v in pairs(json) do | |||
if type(v) == "table" then | |||
json[k] = p.expandJsonRef({json=v}).json | |||
end | |||
end | |||
local result = p.copy(json) | |||
for k,v in pairs(json) do | |||
if (k == "allOf") then | |||
if (type(v) == "table" and v[1] == nil) then v = {v} end -- ensure array | |||
for i,s in pairs(v) do | |||
result = p.tableMerge(s, result) | |||
if (debug) then mw.log("merge allOf with title " .. s["title"]) end | |||
end | |||
result[k] = nil | |||
end | |||
end | |||
return {json=result} | |||
end | |||
function p.defaultArg(arg, default) | function p.defaultArg(arg, default) | ||
if (arg == nil) then | if (arg == nil) then | ||
Line 724: | Line 1,072: | ||
--test: mw.logObject(p.tableMerge({"string", test1="test1", subtable1={"test"}}, {"string2", test1="test2", test3="test4"})) | --test: mw.logObject(p.tableMerge({"string", test1="test1", subtable1={"test"}}, {"string2", test1="test2", test3="test4"})) | ||
function p.tableMerge(t1, t2) | function p.tableMerge(t1, t2) | ||
if (t1 == nil) then t1 = {} elseif (type(t1) ~= 'table') then t1 = {t1} end | |||
if (t2 == nil) then t2 = {} elseif (type(t2) ~= 'table') then t2 = {t2} end | |||
for k,v in pairs(t2) do | for k,v in pairs(t2) do | ||
if type(v) == "table" then | if type(v) == "table" then | ||
Line 749: | Line 1,099: | ||
for k, v in pairs(obj) do res[p.copy(k, s)] = p.copy(v, s) end | for k, v in pairs(obj) do res[p.copy(k, s)] = p.copy(v, s) end | ||
return res | return res | ||
end | |||
-- get normalized label | |||
function p.getDisplayLabel(jsondata, properties) | |||
local display_label = nil | |||
-- check if label properties are mapped | |||
if (properties["HasLabel"] ~= nil and properties["HasLabel"][1] ~= nil) then display_label = p.splitString(properties["HasLabel"][1], '@')[1] | |||
elseif (properties["HasName"] ~= nil) then | |||
if type(properties["HasName"]) == 'table' then display_label = properties["HasName"][1] | |||
else display_label = properties["HasName"] end | |||
-- fall back to unmapped keywords | |||
elseif (jsondata[p.keys.label] ~= nil and jsondata[p.keys.label][1] ~= nil) then display_label = p.splitString(jsondata[p.keys.label][1], '@')[1] | |||
elseif (jsondata[p.keys.name] ~= nil) then display_label = jsondata[p.keys.name] | |||
end | |||
return display_label | |||
end | |||
-- build normalized multilang label | |||
function p.setNormalizedLabel(properties, use_fallbacks) | |||
if (use_fallbacks == nil) then use_fallbacks = true end | |||
if (properties['HasLabel'] ~= nil) then | |||
labels = properties['HasLabel'] | |||
if(type(labels) ~= 'table') then labels = {labels} end | |||
properties['HasNormalizedLabel'] = {} | |||
for i, label in ipairs(labels) do | |||
label_norm = p.splitString(label, '@')[1]:lower():gsub('[^%w]+','') | |||
label_lang = "en" | |||
if (p.splitString(label, '@')[2] ~= nil) then label_lang = p.splitString(label, '@')[2] end | |||
table.insert(properties['HasNormalizedLabel'], label_norm .. "@" .. label_lang) | |||
end | |||
elseif (use_fallbacks and properties['HasName'] ~= nil) then -- fallback, assume English lang | |||
labels = properties['HasName'] | |||
if(type(labels) ~= 'table') then labels = {labels} end | |||
properties['HasNormalizedLabel'] = {} | |||
for i, label in ipairs(labels) do | |||
label_norm = label:lower():gsub('[^%w]+','') | |||
table.insert(properties['HasNormalizedLabel'], label_norm .. "@en") | |||
end | |||
elseif (use_fallbacks and properties['Display title of'] ~= nil) then -- fallback, assume English lang | |||
labels = properties['Display title of'] | |||
if(type(labels) ~= 'table') then labels = {labels} end | |||
properties['HasNormalizedLabel'] = {} | |||
for i, label in ipairs(labels) do | |||
label_norm = label:lower():gsub('[^%w]+','') | |||
table.insert(properties['HasNormalizedLabel'], label_norm .. "@en") | |||
end | |||
end | |||
end | end | ||
return p | return p |
Revision as of 17:04, 21 November 2024
Documentation for this module may be created at Module:MwJson/doc
-- mw.logObject(p.processJsondata({jsondata=p.loadJson({title="Item:OSW7d7193567ea14e4e89b74de88983b718", slot="jsondata"}).json, debug=true, mode="header"}))
local lustache = require("Module:Lustache")
local p = {} --p stands for package
p.keys = { --jsonschema / json-ld keys
category='type',
category_pseudoproperty='Category', -- Property:Category
subcategory='subclass_of',
schema_type='schema_type',
property_ns_prefix='Property',
schema='osl_schema',
template='eval_template',
mode='mode',
context='@context',
allOf='allOf',
label='label',
name='name',
description='description',
text='text',
debug='_debug'
}
p.slots = { --slot names
main='main',
jsondata='jsondata',
jsonschema='jsonschema',
header_template='header_template',
footer_template='footer_template',
data_template='data_template'
}
p.mode = {
header='header',
footer='footer',
query='query'
}
p.cache = {}
--loads json from a wiki page
--test: mw.logObject(p.loadJson({title="JsonSchema:Entity"}))
--test: mw.logObject(p.loadJson({title="Category:Entity", slot="jsonschema"}))
function p.loadJson(args)
local page_title = p.defaultArg(args.title, "JsonSchema:Entity") --for testing
local slot = p.defaultArg(args.slot, 'main')
local debug = p.defaultArg(args.debug, nil)
local msg = ""
local json = {}
if p.cache[page_title] ~= nil then
if p.cache[page_title][slot] ~= nil then
if (debug) then msg = msg .. "Fetch slot " .. p.slots.jsondata .. " of page " .. page_title .. " from cache <br>" end
json = p.cache[page_title][slot]
return {json=json, debug_msg=msg}
end
else p.cache[page_title] = {}
end
if (slot == 'main') then
--json = mw.loadJsonData( "JsonSchema:Entity" ) --requires MediaWiki 1.39
local page = mw.title.makeTitle(p.splitString(page_title, ':')[1], p.splitString(page_title, ':')[2])
local text = page:getContent()
if (text ~= nil) then json = mw.text.jsonDecode(text) end
else
if (debug) then msg = msg .. "Fetch slot " .. p.slots.jsondata .. " of page " .. page_title .. "<br>" end
local text = mw.slots.slotContent( slot , page_title )
if (text ~= nil) then json = mw.text.jsonDecode(text) end
end
local generated_content = json["$defs"] and json["$defs"]["generated"]
if generated_content then
-- Check if "$ref": "#/$defs/generated" exists directly in the table
if json["$ref"] == "#/$defs/generated" then
json = p.tableMerge(p.copy(generated_content), json)
json["$ref"] = nil -- Remove the reference after merging
end
-- Check if "$ref": "#/$defs/generated" is contained in "allOf"
if json["allOf"] then
for _, item in ipairs(json["allOf"]) do
if item["$ref"] == "#/$defs/generated" then
-- Remove the reference after merging
for i, v in ipairs(json["allOf"]) do
if v["$ref"] == "#/$defs/generated" then
table.remove(json["allOf"], i)
break
end
end
json = p.tableMerge(p.copy(generated_content), json)
break
end
end
end
json["$defs"]["generated"] = nil
end
--[[local defs = p.defaultArgPath(json, {"$defs", "generated"}, nil)
if defs == nil then defs = p.defaultArgPath(json, {"definitions", "generated"}, nil) end
if defs ~= nil then
json = p.tableMerge(p.copy(defs), json)
json["allOf"] = p.tableMerge(json["allOf"], p.copy(defs["allOf"]))
end]]--
--mw.logObject(json)
p.cache[page_title][slot] = json
return {json=json, debug_msg=msg}
end
-- test: mw.logObject(p.walkJsonSchema({jsonschema=p.loadJson({title="Category:Hardware", slot="jsonschema"}).json, debug=true}).jsonschema)
function p.walkJsonSchema(args)
local jsonschema = p.defaultArg(args.jsonschema, {})
local jsonschemas = p.defaultArg(args.jsonschemas, {})
local categories = p.defaultArg(args.categories, nil)
local visited = p.defaultArg(args.visited, {})
local mode = p.defaultArg(args.mode, p.mode.header)
--local merged_jsonschema = p.defaultArg(args.merged_jsonschema, {})
local template = p.defaultArg(args.template, nil)
local templates = p.defaultArg(args.templates, {})
local recursive = p.defaultArg(args.recursive, true)
local root = p.defaultArg(args.root, true)
local debug = p.defaultArg(args.debug, false)
local msg = ""
local wikitext = ""
local category_template_slot = nil
if (mode == p.mode.footer) then category_template_slot = p.slots.footer_template end
if (mode == p.mode.header) then category_template_slot = p.slots.header_template end
if (categories == nil) then categories = p.getCategories({jsonschema=jsonschema, includeNamespace=true, includeSchemas=true}).categories end
if (type(categories) ~= 'table') then categories = {categories} end
if (debug) then msg = msg .. "Supercategories: " .. mw.dumpObject(categories) .. "\n<br>" end
for k, category in pairs(categories) do
if (not p.tableContains(visited, category)) then
--mw.logObject("Visit " .. category)
if (debug) then msg = msg .. "Fetch slot " .. p.slots.jsonschema .. " from page " .. category .. "\n<br>" end
local super_jsonschema = nil
if p.splitString(category, ':')[1] == "JsonSchema" then super_jsonschema = p.loadJson({title=category, slot=p.slots.main}).json
else super_jsonschema = p.loadJson({title=category, slot=p.slots.jsonschema}).json end
mw.logObject("INSERT")
mw.logObject(super_jsonschema)
if (super_jsonschema ~= nil) then
if (recursive) then
local res = p.walkJsonSchema({jsonschema=super_jsonschema, jsonschemas=jsonschemas, templates=templates, mode=mode, visited=visited, root=false})
wikitext = wikitext .. res.wikitext
end
--table.insert(jsonschemas, mw.text.jsonDecode( super_jsonschema_str )) --keep a copy of the schema, super_jsonschema passed by references gets modified
--table.insert(jsonschemas, super_jsonschema )
--mw.logObject("Store " .. category)
table.insert(visited, category)
jsonschemas[category] = p.copy( super_jsonschema ) --keep a copy of the schema, super_jsonschema passed by references gets modified
--jsonschema = p.tableMerge(jsonschema, super_jsonschema) --merge superschema is done by the caller
end
if (debug) then msg = msg .. "Fetch slot " .. category_template_slot .. " from page " .. category .. "\n<br>" end
templates[category] = mw.slots.slotContent( category_template_slot , category )
end
end
if (root and p.tableLength(jsonschema) > 0) then
table.insert(visited, "_") -- dummy category for own schema
jsonschemas["_"] = p.copy(jsonschema)
templates["_"] = template
end
if (root) then
for i, category in ipairs(visited) do
--merge all schemas. we need to make a copy here, otherwise jsonschemas["Category:Entity"] contains the merged schema
jsonschema = p.copy(p.tableMerge(jsonschema, jsonschemas[category]))
end
end
if (debug) then wikitext = msg .. wikitext end
return {jsonschema=jsonschema, jsonschemas=jsonschemas, templates=templates, visited=visited, wikitext=wikitext}
end
--[[ test:
category = "Category:Hardware"
page = "Item:OSW7d7193567ea14e4e89b74de88983b718"
category2 = "Category:OSW80e240a2e17d4ae5adfe6419051aa0bb"
page2 = "Item:OSWa4da6664aeac466a86b09e6b32a1cb41"
mw.logObject(p.expandEmbeddedTemplates({
jsonschema=p.walkJsonSchema({jsonschema=p.loadJson({title=category, slot="jsonschema"}).json, debug=true}).jsonschema,
jsondata=p.loadJson({title=page, slot="jsondata"}).json,
debug=true, mode="render"
}).res)
--]]
function p.expandEmbeddedTemplates(args)
local frame = p.defaultArg(args.frame, mw.getCurrentFrame())
local jsondata = p.defaultArg(args.jsondata, {})
local jsonschema = p.defaultArg(args.jsonschema, {})
local template = p.defaultArg(args.template, nil)
local mode = p.defaultArg(args.mode, nil)
local stringify_arrays = p.defaultArg(args.stringify_arrays, false)
local msg = ""
local res = p.defaultArg(args.jsondata, "")
local root = p.defaultArg(args.root, true) -- first entry into recursion
for k,v in pairs(jsondata) do
local eval_template = nil
local eval_templates = p.defaultArgPath(jsonschema, {"properties", k, p.keys.template}, {})
if (eval_templates[1] == nil) then eval_templates = {eval_templates} end --ensure list of objects
for i, t in pairs(eval_templates) do
if (t[p.keys.mode] ~= nil and t[p.keys.mode] == mode) then eval_template = t --use only render templates in render mode and store templates in store mode
elseif (t[p.keys.mode] == nil) then eval_template = t --default
elseif (debug) then msg = msg .. "Ignore eval_template" .. mw.dumpObject( t ) .. "\n<br>"
end
end
if (eval_template ~= nil and eval_template.value ~= nil and (eval_template.type == "mustache" or eval_template.type == "mustache-wikitext")) then
-- mustache can handle objects and array to we can parse it directly
-- todo: handle nested templates
local template_param = {[k]=v}
if (eval_template.root_key == false) then template_param = v end
if (debug) then msg = msg .. "Parse mustache template " .. eval_template.value .. " with params " .. mw.dumpObject( template_param ) .. "\n<br>" end
jsondata[k] = lustache:render(eval_template.value, template_param, p.tableMerge({self=eval_template.value}, eval_template.partials)) -- render with self as registered partial for recursion
if (eval_template.type == "mustache-wikitext") then
jsondata[k] = frame:preprocess( jsondata[k] )
end
elseif type(v) == 'table' then
if (p.tableLength(v) > 0 and v[1] == nil) then --key value array = object/dict
local sub_res = p.expandEmbeddedTemplates({frame=frame, jsondata=v, jsonschema=p.defaultArgPath(jsonschema, {"properties", k}, {}), template=eval_template, mode=mode, stringify_arrays=stringify_arrays, root=false})
msg = msg .. sub_res.debug_msg
jsondata[k] = sub_res.res
--if (sub_res.unparsed ~= nil) then jsondata[k] = sub_res.unparsed else jsondata[k] = sub_res.wikitext end
else --list array
local string_list = ""
for i,e in pairs(v) do
local eval_template = nil
local eval_templates = p.defaultArgPath(jsonschema, {"properties", k, "items", p.keys.template}, {})
if (eval_templates[1] == nil) then eval_templates = {eval_templates} end --ensure list of objects
for i, t in pairs(eval_templates) do
if (t[p.keys.mode] ~= nil and t[p.keys.mode] == mode) then eval_template = t --use only render templates in render mode and store templates in store mode
elseif (t[p.keys.mode] == nil) then eval_template = t --default
elseif (debug) then msg = msg .. "Ignore eval_template" .. mw.dumpObject( t ) .. "\n<br>"
end
end
if type(e) == 'table' then
local sub_res = p.expandEmbeddedTemplates({frame=frame, jsondata=e, jsonschema=p.defaultArgPath(jsonschema, {"properties", k, "items"}, {}), template=eval_template, mode=mode, stringify_arrays=stringify_arrays, root=false})
msg = msg .. sub_res.debug_msg
if (type(sub_res.res) == 'table') then
if (debug) then msg = msg .. "Values for " .. k .. " contains non-literal items: " .. mw.dumpObject( sub_res.res ) .. " => skip value in wikitemplate array param creation\n<br>" end
else
if (stringify_arrays) then string_list = string_list .. sub_res.res .. ";"
else v[i] = sub_res.res end
end
else
if (eval_template ~= nil and eval_template.value ~= nil) then
--evaluate single array item string as json {"self": "<value>", ".": "<value>"} => does not work since jsondata is an object
--e = p.expandEmbeddedTemplates({frame=frame, jsondata={["self"]=e,["."]=e}, jsonschema=p.defaultArgPath(jsonschema, {"properties", k, "items"}, {}), template=eval_template, mode=mode, stringify_arrays=stringify_arrays, root=false})
if (eval_template.type == "mustache" or eval_template.type == "mustache-wikitext") then
if (debug) then msg = msg .. "Parse mustache template " .. eval_template.value .. " with params " .. mw.dumpObject( e ) .. "\n<br>" end
-- {{.}} in the template will be the value of e
e = lustache:render(eval_template.value, e, p.tableMerge({self=eval_template.value}, eval_template.partials)) -- render with self as registered partial for recursion
end
if (eval_template.type == "mustache-wikitext") then --or eval_template.type == "wikitext") then
if (debug) then msg = msg .. "Parse wikitext template " .. e .. " with params " .. mw.dumpObject( e ) .. "\n<br>" end
e = frame:preprocess( e )
end
v[i] = e -- update array
end
if (stringify_arrays) then string_list = string_list .. e .. ";" end
end
end
if (stringify_arrays) then jsondata[k] = string_list end
end
end
end
if (template == nil and root == false) then -- don't stringify root json objects
local templates = jsondata[p.keys.template]
if (templates == nil) then templates = p.defaultArg(jsonschema[p.keys.template], {}) end
if (templates[1] == nil) then templates = {templates} end --ensure list of objects
for i, t in pairs(templates) do
if (t[p.keys.mode] ~= nil and t[p.keys.mode] == mode) then template = t --use only render templates in render mode and store templates in store mode
elseif (t[p.keys.mode] == nil) then template = t --default
elseif (debug) then msg = msg .. "Ignore template" .. mw.dumpObject( t ) .. "\n<br>"
end
end
end
if (template ~= nil and root == false) then -- don't stringify root json objects
if (template.type == "wikitext") then
for k,v in pairs(jsondata) do
if type(v) == 'table' then
if (debug) then msg = msg .. "Values for " .. k .. " contains non-literals: " .. mw.dumpObject( v ) .. " => skip wikitemplate parsing\n<br>" end
return {res=res, debug_msg=msg}
end --not supported
end
if (template.value ~= nil) then
if (debug) then msg = msg .. "Parse wikitemplate " .. template.value .. " with params " .. mw.dumpObject( jsondata ) .. "\n<br>" end
local child = frame:newChild{args=jsondata}
res = child:preprocess( template.value )
elseif (template.page ~= nil) then
if (debug) then msg = msg .. "Parse wikitemplate " .. template.page .. " with params " .. mw.dumpObject( jsondata ) .. "\n<br>" end
res = frame:expandTemplate{ title = template.page, args = jsondata }
end
end
end
--if (debug) then mw.logObject(msg) end
return {res=res, debug_msg=msg}
end
-- mw.logObject(p.processJsondata({jsondata=p.loadJson({title="Item:OSW7d7193567ea14e4e89b74de88983b718", slot="jsondata"}).json, debug=true, mode="header"}))
-- mw.logObject(p.processJsondata({jsondata=p.loadJson({title="Item:OSWa4da6664aeac466a86b09e6b32a1cb41", slot="jsondata"}).json, debug=true, mode="header"}))
-- mw.logObject(p.processJsondata({jsondata=p.loadJson({title="Category:OSWb3022bbf7e7146eb8e6f6e3264f50bbe", slot="jsondata"}).json, debug=true, mode="header", categories={"Category:Category"}}))
function p.processJsondata(args)
local frame = p.defaultArg(args.frame, mw.getCurrentFrame())
local jsondata = p.defaultArg(args.jsondata, {})
local jsonschema = p.defaultArg(args.jsonschema, {})
local template = p.defaultArg(args.template, nil)
local categories = p.defaultArg(args.categories, nil)
local recursive = p.defaultArg(args.recursive, true)
local mode = p.defaultArg(args.mode, p.mode.header)
local debug = p.defaultArg(args.debug, false)
local title = mw.title.getCurrentTitle()
local wikitext = ""
local msg = "" --debug msg
if (p.nilOrEmpty(jsondata) or (p.nilOrEmpty(categories) and p.nilOrEmpty(jsonschema) and p.nilOrEmpty(jsondata[p.keys.category]))) then return {wikitext=wikitext, debug_msg=msg} end --nothing to do here
--if (jsondata == nil or p.tableLength(jsondata) == 0 or (categories == nil and jsonschema == nil and jsondata[p.keys.category] == nil)) then return {wikitext=wikitext, debug_msg=msg} end --nothing to do here
--jsonschema = p.defaultArg(jsonschema, {})
--jsondata = p.defaultArg(jsondata, {})
--if (categories == nil) then categories = jsondata[p.keys.category] end -- let function param overwrite json property
if (not p.nilOrEmpty(jsondata[p.keys.category])) then categories = jsondata[p.keys.category] end -- let json property overwrite function param
local schema_res = p.walkJsonSchema({jsonschema=jsonschema, template=template, categories=categories, mode=mode, recursive=recursive, debug=debug})
local expand_res = p.expandJsonRef({json=schema_res.jsonschema, debug=debug})
jsonschema = expand_res.json
--mw.log(mw.text.jsonEncode(jsonschema))
local jsonld = p.copy(jsondata)
local json_data_store = p.copy(jsondata)
local json_data_render = p.copy(jsondata)
json_res_store = p.expandEmbeddedTemplates({jsonschema=jsonschema, jsondata=json_data_store, mode='store'})
msg = msg .. json_res_store.debug_msg
mw.log("JSONDATA STORE")
mw.logObject(json_res_store.res)
local smw_res = nil
if (mode == p.mode.header) then
-- get the semantic properties by looking up the json keys in the json-ld context
smw_res = p.getSemanticProperties({jsonschema=jsonschema, jsondata=json_res_store.res, store=false, debug=debug})
-- store metadata where properties were defined / overridden
for i, category in ipairs(schema_res.visited) do
for k, v in pairs(p.defaultArgPath(schema_res.jsonschemas, {category, 'properties'}, {})) do --property section may not exisit
if smw_res.definitions[k] == nil then smw_res.definitions[k] = {} end
if smw_res.definitions[k]['defined_in'] == nil then smw_res.definitions[k]['defined_in'] = {} end
table.insert(smw_res.definitions[k]['defined_in'], category)
end
end
-- embed json-ld in resulting html for search engine discovery
jsonld["@context"] = smw_res.context
jsonld["@type"] = p.tableMerge(p.tablefy(jsonschema.schema_type), p.tablefy(jsonld["@type"])) --
jsonld['schema:name'] = p.defaultArgPath(jsonld, {p.keys.label, 1, p.keys.text}, jsonld['name']) --google does not support @value and @lang
jsonld['schema:description'] = p.defaultArgPath(jsonld, {p.keys.description, 1, p.keys.text}, nil)
for k, v in pairs(jsonld) do
if (type(v) == "string") then
local vpart = p.splitString(v, ':')
if (p.tableLength(vpart) == 2 and vpart[1] == "File") then jsonld[k] = mw.getCurrentFrame():callParserFunction( 'filepath', { vpart[2] } ) end --google does not follow redirects via "File":"wiki:Special:Redirect/file/"
end
end
-- wikitext = wikitext .. "<div class='jsonld-header' style='display:none' data-jsonld='" .. mw.text.jsonEncode( jsonld ):gsub("'","`") .. "'></div>"
end
local json_res = p.expandEmbeddedTemplates({jsonschema=jsonschema, jsondata=json_data_render, mode='render'})
msg = msg .. json_res.debug_msg
jsondata =json_res.res
--mw.log("JSONDATA RENDER")
--mw.logObject(jsondata)
local max_index = p.tableLength(schema_res.visited)
for i, category in ipairs(schema_res.visited) do
if (mode == p.mode.footer) then category = schema_res.visited[max_index - i +1] end --reverse order for footer templates
local super_jsonschema = schema_res.jsonschemas[category]
local template = schema_res.templates[category]
if (template ~= nil) then
if (debug) then msg = msg .. "Parse \n\n" .. template .. " \n\nwith params " .. mw.dumpObject( jsondata ) .. "\n<br>" end
local stripped_jsondata={}
for k, v in pairs(jsondata) do
if (type(v) ~= 'table') then stripped_jsondata[k] = v end --delete object values, not supported by wiki templates
end
local child = frame:newChild{args=stripped_jsondata}
if ( template:sub(1, #"=") == "=" ) then template = "\n" .. template end -- add line break if template starts with heading (otherwise not rendered by mw parser)
wikitext = wikitext .. child:preprocess( template )
elseif (mode == p.mode.header) then
local ignore_properties = {[p.keys.category]=true} -- don't render type/category on every subclass
for j, subcategory in ipairs(schema_res.visited) do
if j > i then
local subjsonschema = schema_res.jsonschemas[subcategory]
for k, v in pairs(subjsonschema['properties']) do
-- skip properties that are overwritten in subschemas, render them only once at the most specific position
ignore_properties[k] = true
end
end
end
-- render the infobox for the schema itself and every super_schema using always the global json-ld context (merged within walkJsonSchema())
-- context needs to be preprocessed with buildContext() since the generic json/table merge of the @context atttribute produces a list of strings (remote context) and context objects
-- context is already build in p.getSemanticProperties. schema_allOfMerged is used to provide the full schema for overridden properties
local infobox_res = p.renderInfoBox({jsonschema=super_jsonschema, schema_allOfMerged=jsonschema, context=smw_res.context, property_definitions=smw_res.definitions, jsondata=jsondata, ignore_properties=ignore_properties})
wikitext = wikitext .. frame:preprocess( infobox_res.wikitext )
end
end
local set_categories_in_wikitext = {}
p.tableMerge(set_categories_in_wikitext, json_res_store.res[p.keys.subcategory]) --classes/categories, nil for items
if (title.nsText ~= "Category") then --items
p.tableMerge(set_categories_in_wikitext, json_res_store.res[p.keys.category]) -- categories from schema type
end
-- Todo: Consider moving the category and this block to p.getSemanticProperties with store=true. However, settings categories with @category is only possible for subobjects
if (smw_res ~= nil) then
local display_label = p.getDisplayLabel(jsondata, smw_res.properties)
if title.nsText == "Property" then display_label = p.defaultArgPath(jsondata, {p.keys.name}, display_label) end
if (debug) then msg = msg .. "Store page properties" end
-- category handling
p.tableMerge(set_categories_in_wikitext, smw_res.properties[p.keys.category_pseudoproperty])
smw_res.properties[p.keys.category_pseudoproperty] = nil -- delete pseudo property
smw_res.properties['HasOswId'] = mw.title.getCurrentTitle().fullText --set special property OswId to own title
-- label and display title handling
if display_label ~= nil then
smw_res.properties['Display title of'] = display_label --set special property display title
smw_res.properties['Display title of lowercase'] = display_label:lower() --store lowercase for case insensitive query
smw_res.properties['Display title of normalized'] = display_label:lower():gsub('[^%w]+','') --store with all non-alphanumeric chars removed for normalized query
end
p.setNormalizedLabel(smw_res.properties) --build normalized multilang label
mw.ext.displaytitle.set(display_label)
--smw_res.properties['@category'] = jsondata[p.keys.category]
local store_res = mw.smw.set( smw_res.properties ) --store as semantic properties
if (debug) then msg = msg .. mw.dumpObject(smw_res.properties) end
if (store_res) then
if (debug) then msg = msg .. "SMW SUCCESS: " end
else
wikitext = wikitext .. store_res.error
if (debug) then msg = msg .. "SMW ERROR: " .. store_res.error end
end
--wikitext = mw.dumpObject(smw_res.properties) .. wikitext
end
wikitext = wikitext .. "\n" .. p.setCategories({categories=set_categories_in_wikitext, sortkey=display_label}).wikitext
if (debug) then mw.logObject(res) end
return {wikitext=wikitext, debug_msg=msg}
end
-- renders a default infobox
-- test: mw.logObject(p.renderInfoBox({jsonschema=p.loadJson({title="JsonSchema:Entity"}).json, jsondata={uuid="123123"}}))
function p.renderInfoBox(args)
local debug = p.defaultArg(args.debug, false)
local jsondata = p.defaultArg(args.jsondata, {})
local schema = p.defaultArg(args.jsonschema, nil) -- local schema from the perspective of the current category
local schema_allOfMerged = p.defaultArg(args.schema_allOfMerged, schema) -- global schema with allOfs merged
local property_definitions = p.defaultArg(args.property_definitions, {}) -- dict schema_key: {property: <smw_property>, ...}
local res = ""
if schema == nil then return res end
local context = p.defaultArg(args.context, p.buildContext({jsonschema=schema}).context)
local ignore_properties = p.defaultArg(args.ignore_properties, {})
local schema_label = ""
if schema['title'] ~= nil then schema_label = schema['title'] end
-- see also: https://help.fandom.com/wiki/Extension:Scribunto/HTML_Library_usage_notes
local tbl = mw.html.create( 'table' )
tbl
:attr( 'class', 'info_box' )
:tag( 'tr' )
:tag( 'th' )
:attr( 'class', 'heading' )
:attr( 'colspan', '2' )
:wikitext( schema_label )
for k,v in pairs(jsondata) do
if (not ignore_properties[k]) then
if (schema['properties'] ~= nil and schema['properties'][k] ~= nil and (type(v) ~= 'table' or v[1] ~= nil)) then --literal or literal array
local def = schema_allOfMerged['properties'][k]
--mw.logObject(def)
local label = k
if def['title'] ~= nil then label = def['title'] end
if def['title*'] ~= nil then -- multilang label with switch
label = "{{#switch:{{USERLANGUAGECODE}} |#default=" .. label
for k,v in pairs(def['title*']) do label = label .. " |" .. k .. "=" .. v end
label = label .. " }}"
end
local description = ""
if def['description'] ~= nil then description = def['description'] end
if def['description*'] ~= nil then -- multilang label with switch
description = "{{#switch:{{USERLANGUAGECODE}} |#default=" .. description
for k,v in pairs(def['description*']) do description = description .. " |" .. k .. "=" .. v end
description = description .. " }}"
end
if (p.tableLength(p.defaultArgPath(property_definitions, {k, 'defined_in'}, {})) > 0) then description = description .. "<br>Definition: " end
for i, c in pairs(p.defaultArgPath(property_definitions, {k, 'defined_in'}, {})) do
if (i > 1) then description = description .. ", " end
description = description .. "[[:" ..c .. "]]"
end
if (description ~= "") then description = "{{#info: " .. description .. "|note }}" end -- smw tooltip
label = label .. description
--res = res .. title ": " .. v
local cell = tbl:tag( 'tr' )
:tag( 'th' )
:wikitext( label )
:done()
:tag( 'td' )
if (type(v) == 'table') then
for i,e in pairs(v) do
if (type(e) ~= 'table') then
local p_type = p.defaultArgPath(context, {k, '@type'}, '@value')
if (p_type == '@id' and p.defaultArgPath(def, {'items', 'type'}, 'unknown') == 'string' and def['eval_template'] == nil) then
-- auto-link (OSW-)IDs if no eval_template is present
e = string.gsub(e, "Category:", ":Category:") -- make sure category links work
e = string.gsub(e, "File:", ":File:") -- do not embedd images but link to them
e = "[[" .. e .. "]]"
elseif (p_type == 'xsd:date') then -- formate date with user preferences
e = "{{#dateformat:" .. e .. "|ymd}}"
elseif (p_type == 'xsd:dateTime') then -- formate time with user preferences
local smw_property = p.defaultArgPath(property_definitions, {k, 'property'})
if (smw_property ~= nil) then e = "{{#ask: [[{{FULLPAGENAME}}]]|?" .. smw_property .. "#LOCL#TO= |format=plain |mainlabel=-}}"
else
local _, _, date, hours, minutes = string.find(e, "(%S+)[T ](%S+)[:](%S+)[:?]")
e = "{{#dateformat:" .. date .. "|ymd}} " .. hours .. ":" .. minutes .. " (UTC)"
end
elseif (type(v) == 'boolean') then
if (v) then v = "✅" else v = "❌" end -- green check mark or red cross
elseif ((string.len(e) > 100) and (string.find(e, "{{") == nil) and (string.find(e, "</") == nil) and (string.find(e, "%[%[") == nil)) then -- no markup, no links
e = string.sub(e, 1, 100) .. "..."; -- limit infobox plain text to max 100 chars
elseif (debug) then
mw.log("Unformated: " .. k .. " " .. p.defaultArgPath(def, {'items', 'type'}, 'unknown'))
mw.logObject(def)
end
cell:wikitext("\n* " .. e .. "")
end
end
else
local p_type = p.defaultArgPath(context, {k, '@type'}, '@value')
if (p_type == '@id' and p.defaultArgPath(def, {'type'}, 'unknown') == 'string' and def['eval_template'] == nil) then
-- auto-link (OSW-)IDs if no eval_template is present
v = string.gsub(v, "Category:", ":Category:") -- make sure category links work
v = string.gsub(v, "File:", ":File:") -- do not embedd images but link to them
v = "[[" .. v .. "]]"
elseif (p_type == 'xsd:date') then -- formate date & time with user preferences
v = "{{#dateformat:" .. v .. "|ymd}}"
elseif (p_type == 'xsd:dateTime') then -- formate time with user preferences
local smw_property = p.defaultArgPath(property_definitions, {k, 'property'})
if (smw_property ~= nil) then v = "{{#ask: [[{{FULLPAGENAME}}]]|?" .. smw_property .. "#LOCL#TO= |format=plain |mainlabel=-}}"
else
local _, _, date, hours, minutes = string.find(v, "(%S+)[T ](%S+)[:](%S+)[:?]")
v = "{{#dateformat:" .. date .. "|ymd}} " .. hours .. ":" .. minutes .. " (UTC)"
end
elseif (type(v) == 'boolean') then
if (v) then v = "✅" else v = "❌" end -- green check mark or red cross
elseif ((string.len(v) > 100) and (string.find(v, "{{") == nil) and (string.find(v, "</") == nil) and (string.find(v, "%[%[") == nil)) then -- no markup, no links
v = string.sub(v, 1, 100) .. "..."; -- limit infobox plain text to max 100 chars
elseif (debug) then
mw.log("Unformated: " .. k .. " " .. p.defaultArgPath(def, {'type'}, 'unknown'))
mw.logObject(def)
end
cell:wikitext("\n" .. v .. "")
end
end
end
end
res = res .. tostring( tbl )
--mw.logObject(res)
return {wikitext=res}
end
-- test
-- mw.logObject(p.getCategories({jsonschema={allOf={["$ref"]="/wiki/Category:Test?action=raw&slot=jsonschema"}}, includeNamespace=true}))
-- mw.logObject(p.getCategories({jsonschema={allOf={{["$ref"]="/wiki/Category:Test?action=raw&slot=jsonschema"}, {["$ref"]="/wiki/Category:Test2?action=raw&slot=jsonschema"}}}}))
function p.getCategories(args)
local jsonschema = p.defaultArg(args.jsonschema, {})
local includeNamespace = p.defaultArg(args.includeNamespace, false)
local includeSchemas = p.defaultArg(args.includeSchemas, false)
local categories = {}
local allOf = jsonschema[p.keys.allOf]
if (allOf ~= nil) then
--properties['@category'] = {}
for k, entry in pairs(allOf) do
local refs = nil
if type(entry) == 'table' then refs = entry -- "allOf": [{"$ref": "/wiki/Category:Test?action=raw"}]
else refs = {entry} end-- "allOf": {"$ref": "/wiki/Category:Test?action=raw"}
for p, v in pairs(entry) do
if (p == '$ref') then
for category in v:gmatch("Category:([^?]+)") do -- e.g. "/wiki/Category:Test?action=raw"
if (includeNamespace) then category = "Category:" .. category end
table.insert(categories, category)
end
if includeSchemas then
for schema in v:gmatch("JsonSchema:([^?]+)") do -- e.g. "/wiki/JsonSchema:Test?action=raw"
if (includeNamespace) then schema = "JsonSchema:" .. schema end
table.insert(categories, schema)
end
end
end
end
end
end
return {categories=categories}
end
--sets a list of categories on the page
--test: mw.logObject(p.setCategories({categories={"Cat1", "Category:Cat2"}}))
function p.setCategories(args)
local categories = p.defaultArg(args.categories, {})
local sortkey = p.defaultArg(args.sortkey, "")
if (sortkey ~= "") then sortkey = "|" .. sortkey end
if (type(categories) ~= 'table') then categories = {categories} end
local res = ""
for k, entry in pairs(categories) do
res = res .. "[[Category:" .. string.gsub(entry, "Category:", "") .. sortkey .."]]"
end
return {wikitext=res}
end
--[[ test
category = "Category:Entity"
jsonschema = p.expandJsonRef({json=p.loadJson({title=category, slot="jsonschema"}).json}).json
mw.logObject(p.buildContext({jsonschema=jsonschema, debug=true}))
mw.log(mw.text.jsonEncode(p.buildContext({jsonschema=jsonschema, debug=false}).context))
or
jsonschema = {
["@context"]={test="level 0"},
properties={
test={
type="object",
["@context"]={test1="level 1"},
properties= {
test= {
type="array",
items= {
type="object",
["@context"]={test2="level 2"}
}
}
}
}
}
}
mw.logObject(p.buildContext({jsonschema=jsonschema, debug=true}))
--]]
-- constructs a property specific local jsonld context
function p.buildContext(args)
local schema = p.defaultArg(args.jsonschema, {})
--mw.logObject(schema)
local context = p.defaultArg(args.context, schema[p.keys.context])
local result = p.defaultArg(args.result, {})
if (context ~= nil) then
for k,v in pairs(context) do
if type(k) == 'number' and type(v) == 'string' then
--table.insert(result, v) --skip context imports
elseif (type(v) == 'table' and v[1] ~= nil) then --custom addtional mappings, e. g. "type*": ["Property:HasType"]
result[k] = v
elseif (type(v) == 'table' and v['@id'] == nil and v['@reverse'] == nil) then --subcontext
p.tableMerge(result, p.buildContext({context=v}).context)
else
result[k] = v
end
end
end
local properties = p.defaultArg(schema.properties, {})
-- build property context
for k,v in pairs(properties) do
local subcontext = nil
if (p.defaultArgPath(properties, {k, 'type'}) == 'object') then
--mw.logObject(properties[k])
subcontext = p.buildContext({jsonschema=properties[k]}).context
elseif (p.defaultArgPath(properties, {k, 'items', 'type'}) == 'object') then
--mw.logObject(properties[k]['items'])
subcontext = p.buildContext({jsonschema=properties[k]['items']}).context
end
if (subcontext ~= nil and p.tableLength(subcontext) > 0) then
if (result[k] == nil) then result[k] = {} end
if (type(result[k]) == 'string') then result[k] = {["@id"]=result[k]} end
if (result[k][p.keys.context] == nil) then result[k][p.keys.context] = {} end
result[k][p.keys.context] = p.tableMerge(result[k][p.keys.context], subcontext)
end
end
return {context=result}
end
--maps jsondata values to semantic properties by using the @context attribute within the schema
--test: mw.logObject(p.getSemanticProperties({jsonschema={["@context"]={test="Property:schema:TestProperty", myObjectProperty={["@id"]= "Property:MyObjectProperty", ["@type"]= "@id"}}}, jsondata={test="TestValue", myObjectProperty="123"}, debug=true}))
--test: mw.logObject(p.getSemanticProperties({jsonschema={["@context"]={"some uri",{test="Property:TestProperty", myObjectProperty={["@id"]= "Property:MyObjectProperty", ["@type"]= "@id"}}}}, jsondata={test="TestValue", myObjectProperty="123"}, debug=true}))
--[[
mw.logObject(p.getSemanticProperties({jsonschema={["@context"]={test="Property:TestProperty", subobject="Property:HasSubobject", myObjectProperty={["@id"]= "Property:MyObjectProperty", ["@type"]= "@id"}}}, jsondata={
test="TestValue", myObjectProperty="123", subobject={uuid="123-123-123", test="TestValue2"}
}, debug=true}))
mw.logObject(p.getSemanticProperties({jsonschema=p.loadJson({title="Category:OSW80e240a2e17d4ae5adfe6419051aa0bb", slot="jsonschema"}).json, p.loadJson({title="Item:OSWa4da6664aeac466a86b09e6b32a1cb41", slot="jsonsdata"}).json, debug=true}))
category = "Category:Hardware"
page = "Item:OSW7d7193567ea14e4e89b74de88983b718"
category2 = "Category:OSW80e240a2e17d4ae5adfe6419051aa0bb"
page2 = "Item:OSWa4da6664aeac466a86b09e6b32a1cb41"
jsonschema =p.walkJsonSchema({jsonschema=p.loadJson({title=category, slot="jsonschema"}).json, debug=true}).jsonschema
mw.logObject(p.getSemanticProperties({
jsonschema=jsonschema,
jsondata=p.expandEmbeddedTemplates({jsonschema=jsonschema, jsondata=p.loadJson({title=page, slot="jsondata"}).json}).res,
debug=true
}).properties)
--]]
function p.getSemanticProperties(args)
local jsondata = p.defaultArg(args.jsondata, {})
local schema = p.defaultArg(args.jsonschema, {})
local subschema = p.defaultArg(args.subschema, schema)
local parent_schema_property = p.defaultArg(args.parent_schema_property, {}) -- ToDo: Not used except in getSemanticQuery => remove
local store = p.defaultArg(args.store, false)
local root = p.defaultArg(args.root, true)
local properties = p.defaultArg(args.properties, {}) --semantic properties to store, dict key=property_name, value=array of string values
local debug = p.defaultArg(args.debug, false)
--if (debug) then mw.logObject("Call getSemanticProperties with args " .. mw.dumpObject( args ) .. "\n<br>") end
local subjectId = mw.title.getCurrentTitle().fullText
local subobjectId = nil
if (root == false and jsondata['uuid'] ~= nil) then
subobjectId = "OSW" .. string.gsub(jsondata['uuid'], "-", "")
subjectId = subjectId .. '#' .. subobjectId
end
local property_data = {}
local context = p.defaultArg(args.context, p.buildContext({jsonschema=schema}).context)
local error = ""
if (debug) then mw.logObject(context) end
if schema ~= nil and context ~= nil then
local schema_properties = p.defaultArg(subschema.properties, {})
if (debug and root) then
for k,v in pairs(context) do
if type(k) == 'number' then mw.logObject("imports " .. v)
elseif type(v) == 'table' and v["@id"] ~= nil then mw.logObject("" .. k .. " maps to " .. v["@id"])
else mw.logObject("" .. k .. " maps to " .. mw.dumpObject(v)) end
end
end
for k,v in pairs(jsondata) do
local property_names = {}
local subobject_properties = {} -- reverse properties to store in the subobject
local mapping_found = false
local property_definitions = {} -- list of objects {id=..., reverse=...}
for term, def in pairs(context) do
local term_parts = p.splitString(term, "*")
if (term_parts[1] == k) then --custom additional mapping term*(*...): "Property:..."
if type(def) == 'table' then
-- note: json-ld allows only @id OR @reverse
if (def["@id"] ~= nil) then table.insert(property_definitions, {id=def["@id"], reverse=false}) end
if (def["@reverse"] ~= nil) then table.insert(property_definitions, {id=def["@reverse"], reverse=true}) end
else table.insert(property_definitions, {id=def}) end
end
end
if (debug) then mw.logObject(property_definitions) end
for i,e in ipairs(property_definitions) do
local id = e["id"]
local property_definition = p.splitString(id, ':')
if property_definition[1] == p.keys.property_ns_prefix then
mapping_found = true
property_name = string.gsub(id, p.keys.property_ns_prefix .. ":", "") -- also allow prefix properties like: Property:schema:url
if (e["reverse"]) then -- reverse properties are handled in the respective subobject
if (subobject_properties[property_name] == nil) then subobject_properties[property_name] = {} end --initialize empty list
table.insert(subobject_properties[property_name], subjectId) -- add triple subobject -property-> subject
else table.insert(property_names, property_name) end
local schema_property = p.defaultArg(schema_properties[k], {})
local schema_type = p.defaultArg(schema_property.type, nil) --todo: also load smw property type on demand
property_data[k] = {schema_type=schema_type, schema_data=schema_property, property=property_name, value=v, reverse=e["reverse"]}
end
end
for i, property_name in ipairs(property_names) do
if (properties[property_name] == nil) then properties[property_name] = {} end --initialize empty list
end
if type(v) == 'table' then
--if (debug) then mw.logObject("prop " .. k .. " = " .. mw.dumpObject(v)) end
if (mapping_found) then
local subcontext = p.copy(p.defaultArgPath(context, {k, p.keys.context}, {})) --deepcopy, see also https://phabricator.wikimedia.org/T269990
context = p.tableMerge(context, subcontext) -- pull up nested context
local values = {}
if (p.tableLength(v) > 0 and v[1] == nil) then --key value array = object/dict => subobject
local subproperties_res = p.getSemanticProperties({jsonschema=schema, jsondata=v, properties=p.copy(subobject_properties), store=true, root=false, debug=debug, context=context, subschema=schema_properties[k], parent_schema_property=property_data[k]})
local id = subproperties_res.id --subobject_id
if (id ~= nil) then
id = mw.title.getCurrentTitle().fullText .. '#' .. id
table.insert(values, id)
end
properties = p.processStatement({subject=properties, statement=subproperties_res.properties, debug=debug}).subject
else --list array
for i, e in pairs(v) do
if (type(e) == 'table') then
local subproperties_res = p.getSemanticProperties({jsonschema=schema, jsondata=e, properties=p.copy(subobject_properties), store=true, root=false, debug=debug, context=context, subschema=schema_properties[k], parent_schema_property=property_data[k]})
local id = subproperties_res.id --subobject_id
if (id ~= nil) then
id = mw.title.getCurrentTitle().fullText .. '#' .. id
table.insert(values, id)
end
properties = p.processStatement({subject=properties, statement=subproperties_res.properties, debug=debug}).subject
else values = v end --plain strings
end
end
for pi, property_name in ipairs(property_names) do
for i,value in pairs(values) do table.insert(properties[property_name], value) end
if (debug) then mw.logObject("set " .. property_name .. " = " .. mw.dumpObject(values)) end
end
else if (debug) then mw.logObject("not mapped: " .. k .. " = " .. mw.dumpObject(v)) end
end
else
if (mapping_found) then
for pi, property_name in ipairs(property_names) do
table.insert(properties[property_name], v)
if (debug) then mw.logObject("set " .. property_name .. " = " .. mw.dumpObject(v)) end
end
else
if (debug) then mw.logObject("not mapped: " .. k .. " = " .. mw.dumpObject(v)) end
end
end
end
end
local store_res = nil
if (store) then
properties['HasOswId'] = subjectId
if (root) then
if (debug) then mw.logObject("Store page properties") end
store_res = mw.smw.set( properties ) --store as semantic properties
else
properties['@category'] = {}
p.tableMerge(properties['@category'], jsondata[p.keys.category]) -- from json property 'type'
p.tableMerge(properties['@category'], properties[p.keys.category_pseudoproperty]) -- from json-ld context 'Property:Category'
properties[p.keys.category_pseudoproperty] = nil -- delete pseudo property
local display_label = p.getDisplayLabel(jsondata, properties)
if properties['Display title of'] == nil and properties['Display_title_of'] == nil then
if (display_label ~= nil and display_label ~= "") then properties['Display title of'] = display_label
else properties['Display title of'] = p.defaultArg(subschema['title'], "") end -- fall back to property name in schema
end
p.setNormalizedLabel(properties) --build normalized multilang label
if (p.tableLength(properties) > 0) then
store_res = mw.smw.subobject( properties, subobjectId ) --store as subobject
if (debug) then mw.logObject("Store subobject with id " .. (subobjectId or "<random>")) end
end
end
end
if (debug) then mw.logObject(properties) end
if (store_res ~= nil) then
if (not store_res and store_res.error ~= nil) then error = error .. store_res.error end
end
if (debug) then mw.logObject(error) end
return {properties=properties, definitions=property_data, id=subobjectId, context=context, error=error}
end
function p.processStatement(args)
local statement = p.defaultArg(args.statement)
local subject = p.defaultArg(args.subject)
local debug = p.defaultArg(args.debug, false)
-- handle "approved" statements
if (statement["HasSubject"] == nil or statement["HasSubject"][1] == nil or statement["HasSubject"][1] == "") then --implicit subject
if (statement["HasProperty"] ~= nil and statement["HasProperty"][1] ~= nil and statement["HasProperty"][1] ~= "" and statement["HasObject"] ~= nil) then
local property = string.gsub(statement["HasProperty"][1], p.keys.property_ns_prefix .. ":", "") -- also allow prefix properties like: Property:schema:url
if (debug) then
mw.log("Set property " .. property .. " from statement to ")
mw.logObject(statement["HasObject"])
end
if (subject[property] == nil) then subject[property] = {} end
for k, v in pairs(statement["HasObject"]) do table.insert(subject[property], v) end
end
end
return {subject=subject}
end
-- build a semantic query based on provided properties and their schema definition
--[[ test:
mw.logObject(p.getSemanticQuery({
jsonschema={
["@context"]={
test="Property:TestProperty",
number_max="Property:HasNumber",
date_min="Property:HasDate"
},
properties={
test={title="Test", type="string"},
number_max={title="Number", type="string", format="number", options={role={query={filter="max"}}}},
date_min={title="Date", type="string", format="date", options={role={query={filter="min"}}}},
}
},
jsondata={test="TestValue", number_max=5, date_min="01.01.2023"}
}))
--]]
function p.getSemanticQuery(args)
--local jsondata = p.defaultArg(args.jsondata, {})
--local schema = p.defaultArg(args.jsonschema, {})
local res = ""
local where = ""
local select = ""
local semantic_properties = p.getSemanticProperties(args)
--mw.logObject(semantic_properties)
for k,def in pairs(semantic_properties.definitions) do
-- see also: https://www.semantic-mediawiki.org/wiki/Help:Search_operators
local filter = p.defaultArgPath(def.schema_data, {'options', 'role', 'query', 'filter'}, 'eq')
local value = def.value
if def.schema_data.type == 'string' and (def.schema_data.format == 'number' or def.schema_data.format == 'date') then
if (filter == 'min') then value = "<" .. value
elseif (filter == 'max') then value = ">" .. value
else value = value end --exact match
elseif def.schema_data.type == 'string' then
value = "~*" .. value .. "*"
end
where = where .. "\n[[".. def.property .. "::" .. value .. "]]"
select = select .. "\n|?" .. def.property
if (def.schema_data.title ~= nil) then select = select .. "=" .. def.schema_data.title end
end
if (where ~= "") then res = "{{#ask:" .. res .. where .. select .. "}}" end
return {wikitext=res}
end
-- HELPERS
-- expands all $ref
--test: mw.logObject(p.expandJsonRef({json={items={test="value", ["$ref"]="/wiki/JsonSchema:Label?action=raw"}}}).json)
--test: mw.logObject(p.expandJsonRef({json={["$ref"]="/wiki/Category:Item?action=raw&slot=jsonschema"}}).json)
--test: mw.logObject(p.expandJsonRef({json={["$ref"]="/wiki/JsonSchema:Statement?action=raw"}}).json)
function p.expandJsonRef(args)
local json = p.defaultArg(args.json, {})
local debug = p.defaultArg(args.debug, false)
local refs = {}
for k,v in pairs(json) do
if (k == "$ref") then
-- e. g. "/wiki/JsonSchema:Label?action=raw" or "/wiki/Category:Entity?action=raw&slot=jsonschema"
if string.find(v, "#") then
if (debug) then mw.logObject("Skip relative reference") end
else
local uri = mw.uri.new(v)
local ref_title = mw.text.split(uri.path, "wiki/", true)[2]
local ref_slot = uri.query["slot"]
if (debug) then
if (ref_slot ~= nil) then mw.logObject("Ref found with title " .. ref_title .. " and slot " .. ref_slot)
else mw.logObject("Ref found with title " .. ref_title) end
end
local ref_json = p.loadJson({title=ref_title, slot=ref_slot}).json
refs[v] = ref_json
json[k] = nil
end
end
end
--mw.logObject(refs)
for k,v in pairs(refs) do
json = p.tableMerge(v, json)
end
for k,v in pairs(json) do
if type(v) == "table" then
json[k] = p.expandJsonRef({json=v}).json
end
end
local result = p.copy(json)
for k,v in pairs(json) do
if (k == "allOf") then
if (type(v) == "table" and v[1] == nil) then v = {v} end -- ensure array
for i,s in pairs(v) do
result = p.tableMerge(s, result)
if (debug) then mw.log("merge allOf with title " .. s["title"]) end
end
result[k] = nil
end
end
return {json=result}
end
function p.defaultArg(arg, default)
if (arg == nil) then
return default
else
return arg
end
end
-- returns the value of a table (dict) path or default, if the path is not defined
-- test: mw.logObject(p.defaultArgPath({some={defined={path="value"}}}, {"some", "defined", "path"}, "default_value"))
-- test: mw.logObject(p.defaultArgPath({some={defined={path="value"}}}, {"some", "undefined", "path"}, "default_value"))
function p.defaultArgPath(arg, path, default)
if (arg == nil) then
return default
elseif (path == nil) then
return arg
else
key = table.remove(path,1)
if (key == nil) then return arg end --end of path
return p.defaultArgPath(arg[key], path, default)
end
end
function p.splitString(inputstr, sep)
if sep == nil then
sep = ";"
end
local t={}
for str in string.gmatch(inputstr, "([^"..sep.."]+)") do
table.insert(t, str)
end
return t
end
--dumps a table to a string (replaced by mw.dumpObject())
function p.dump(o)
return mw.dumpObject(o)
end
--converts a literal to an table
function p.tablefy(o)
if (o == nil) then o = {} end
if (type(o) ~= 'table') then o = {o} end
return o
end
--true if the value is contained in the array (flat arrays only)
function p.tableContains (tab, val)
for index, value in ipairs(tab) do
if value == val then
return true
end
end
return false
end
--get the size of a table
function p.tableLength(t)
local count = 0
for _ in pairs(t) do count = count + 1 end
return count
end
--check if a variable is nil or an empty string or table
function p.nilOrEmpty(o)
if (o == nil) then return true
elseif (type(o) == 'string' and o == "") then return true
elseif (type(o) == 'table' and p.tableLength(o) == 0) then return true
else return false
end
end
-- merges t2 to t1
--test: mw.logObject(p.tableMerge({"string", test1="test1", subtable1={"test"}}, {"string2", test1="test2", test3="test4"}))
function p.tableMerge(t1, t2)
if (t1 == nil) then t1 = {} elseif (type(t1) ~= 'table') then t1 = {t1} end
if (t2 == nil) then t2 = {} elseif (type(t2) ~= 'table') then t2 = {t2} end
for k,v in pairs(t2) do
if type(v) == "table" then
if type(t1[k] or false) == "table" then
p.tableMerge(t1[k] or {}, t2[k] or {})
else
if type(k) == 'number' then table.insert(t1, v)
else t1[k] = v end
end
else
if type(k) == 'number' then table.insert(t1, v)
else t1[k] = v end
end
end
return t1
end
-- from https://stackoverflow.com/questions/640642/how-do-you-copy-a-lua-table-by-value
function p.copy(obj, seen)
if type(obj) ~= 'table' then return obj end
if seen and seen[obj] then return seen[obj] end
local s = seen or {}
local res = setmetatable({}, getmetatable(obj))
s[obj] = res
for k, v in pairs(obj) do res[p.copy(k, s)] = p.copy(v, s) end
return res
end
-- get normalized label
function p.getDisplayLabel(jsondata, properties)
local display_label = nil
-- check if label properties are mapped
if (properties["HasLabel"] ~= nil and properties["HasLabel"][1] ~= nil) then display_label = p.splitString(properties["HasLabel"][1], '@')[1]
elseif (properties["HasName"] ~= nil) then
if type(properties["HasName"]) == 'table' then display_label = properties["HasName"][1]
else display_label = properties["HasName"] end
-- fall back to unmapped keywords
elseif (jsondata[p.keys.label] ~= nil and jsondata[p.keys.label][1] ~= nil) then display_label = p.splitString(jsondata[p.keys.label][1], '@')[1]
elseif (jsondata[p.keys.name] ~= nil) then display_label = jsondata[p.keys.name]
end
return display_label
end
-- build normalized multilang label
function p.setNormalizedLabel(properties, use_fallbacks)
if (use_fallbacks == nil) then use_fallbacks = true end
if (properties['HasLabel'] ~= nil) then
labels = properties['HasLabel']
if(type(labels) ~= 'table') then labels = {labels} end
properties['HasNormalizedLabel'] = {}
for i, label in ipairs(labels) do
label_norm = p.splitString(label, '@')[1]:lower():gsub('[^%w]+','')
label_lang = "en"
if (p.splitString(label, '@')[2] ~= nil) then label_lang = p.splitString(label, '@')[2] end
table.insert(properties['HasNormalizedLabel'], label_norm .. "@" .. label_lang)
end
elseif (use_fallbacks and properties['HasName'] ~= nil) then -- fallback, assume English lang
labels = properties['HasName']
if(type(labels) ~= 'table') then labels = {labels} end
properties['HasNormalizedLabel'] = {}
for i, label in ipairs(labels) do
label_norm = label:lower():gsub('[^%w]+','')
table.insert(properties['HasNormalizedLabel'], label_norm .. "@en")
end
elseif (use_fallbacks and properties['Display title of'] ~= nil) then -- fallback, assume English lang
labels = properties['Display title of']
if(type(labels) ~= 'table') then labels = {labels} end
properties['HasNormalizedLabel'] = {}
for i, label in ipairs(labels) do
label_norm = label:lower():gsub('[^%w]+','')
table.insert(properties['HasNormalizedLabel'], label_norm .. "@en")
end
end
end
return p