blob: b14055341a0d547695d95b651d93d000ffe25d6f [file] [log] [blame]
#!/usr/bin/env node
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
import fs from 'fs-extra';
import snarkdown from 'snarkdown';
const OUTPUT_FILE = 'lib/sql-docs.ts';
const MINIMUM_EXPECTED_NUMBER_OF_FUNCTIONS = 198;
const MINIMUM_EXPECTED_NUMBER_OF_DATA_TYPES = 15;
const initialFunctionDocs = {
TABLE: [['external', convertMarkdownToHtml('Defines a logical table from an external.')]],
EXTERN: [
['inputSource, inputFormat, rowSignature?', convertMarkdownToHtml('Reads external data.')],
],
TYPE: [
[
'nativeType',
convertMarkdownToHtml(
'A purely type system modification function what wraps a Druid native type to make it into a SQL type.',
),
],
],
UNNEST: [
[
'arrayExpression',
convertMarkdownToHtml("Unnests ARRAY typed values. The source for UNNEST can be an array type column, or an input that's been transformed into an array, such as with helper functions like `MV_TO_ARRAY` or `ARRAY`.")
]
]
};
function hasHtmlTags(str) {
return /<(a|br|span|div|p|code)\/?>/.test(str);
}
function sanitizeArguments(str) {
str = str.replace(/`<code>&#124;<\/code>`/g, '|'); // convert the hack to get | in a table to a normal pipe
// Ensure there are no more html tags other than the <code> we just removed
if (hasHtmlTags(str)) {
throw new Error(`Arguments contain HTML: ${str}`);
}
return str;
}
function convertMarkdownToHtml(markdown) {
markdown = markdown.replace(/<br\/?>/g, '\n'); // Convert inline <br> to newlines
// Ensure there are no more html tags other than the <br> we just removed
if (hasHtmlTags(markdown)) {
throw new Error(`Markdown contains HTML: ${markdown}`);
}
// Concert to markdown
markdown = snarkdown(markdown);
return markdown.replace(/<a[^>]*>(.*?)<\/a>/g, '$1'); // Remove links
}
const readDoc = async () => {
const data = [
await fs.readFile('../docs/querying/sql-data-types.md', 'utf-8'),
await fs.readFile('../docs/querying/sql-scalar.md', 'utf-8'),
await fs.readFile('../docs/querying/sql-aggregations.md', 'utf-8'),
await fs.readFile('../docs/querying/sql-array-functions.md', 'utf-8'),
await fs.readFile('../docs/querying/sql-multivalue-string-functions.md', 'utf-8'),
await fs.readFile('../docs/querying/sql-json-functions.md', 'utf-8'),
await fs.readFile('../docs/querying/sql-window-functions.md', 'utf-8'),
await fs.readFile('../docs/querying/sql-operators.md', 'utf-8'),
].join('\n');
const lines = data.split('\n');
const functionDocs = initialFunctionDocs;
const dataTypeDocs = {};
for (const line of lines) {
const functionMatch = line.match(/^\|\s*`(\w+)\(([^|]*)\)`\s*\|([^|]+)\|(?:([^|]+)\|)?$/);
if (functionMatch) {
const functionName = functionMatch[1];
const args = sanitizeArguments(functionMatch[2]);
const description = convertMarkdownToHtml(functionMatch[3]);
functionDocs[functionName] = functionDocs[functionName] || [];
functionDocs[functionName].push([args, description]);
}
const dataTypeMatch = line.match(/^\|([A-Z]+)\|([A-Z]+)\|([^|]*)\|([^|]*)\|$/);
if (dataTypeMatch) {
dataTypeDocs[dataTypeMatch[1]] = [dataTypeMatch[2], convertMarkdownToHtml(dataTypeMatch[4])];
}
}
// Make sure there are enough functions found
const numFunction = Object.keys(functionDocs).length;
if (!(MINIMUM_EXPECTED_NUMBER_OF_FUNCTIONS <= numFunction)) {
throw new Error(
`Did not find enough function entries did the file structure change? (found ${numFunction} but expected at least ${MINIMUM_EXPECTED_NUMBER_OF_FUNCTIONS})`,
);
}
// Make sure there are at least 10 data types for sanity
const numDataTypes = Object.keys(dataTypeDocs).length;
if (!(MINIMUM_EXPECTED_NUMBER_OF_DATA_TYPES <= numDataTypes)) {
throw new Error(
`Did not find enough data type entries did the file structure change? (found ${numDataTypes} but expected at least ${MINIMUM_EXPECTED_NUMBER_OF_DATA_TYPES})`,
);
}
const content = `/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
// This file is auto generated and should not be modified
// prettier-ignore
export const SQL_DATA_TYPES: Record<string, [runtime: string, description: string]> = ${JSON.stringify(
dataTypeDocs,
null,
2,
)};
// prettier-ignore
export const SQL_FUNCTIONS: Record<string, [args: string, description: string][]> = ${JSON.stringify(
functionDocs,
null,
2,
)};
`;
// eslint-disable-next-line no-undef
console.log(`Found ${numDataTypes} data types and ${numFunction} functions`);
await fs.writeFile(OUTPUT_FILE, content, 'utf-8');
};
readDoc();