| #!/usr/bin/env python3 |
| # Copyright (C) 2022 The Android Open Source Project |
| # |
| # Licensed under the Apache License, Version 2.0 (the 'License'); |
| # you may not use this file except in compliance with the License. |
| # You may obtain a copy of the License at |
| # |
| # http://www.apache.org/licenses/LICENSE-2.0 |
| # |
| # Unless required by applicable law or agreed to in writing, software |
| # distributed under the License is distributed on an 'AS IS' BASIS, |
| # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| # See the License for the specific language governing permissions and |
| # limitations under the License. |
| |
| from dataclasses import dataclass |
| from re import Match |
| from typing import List, Optional, Tuple |
| |
| from python.generators.sql_processing.utils import ObjKind |
| from python.generators.sql_processing.utils import extract_comment |
| from python.generators.sql_processing.utils import match_pattern |
| from python.generators.sql_processing.utils import PATTERN_BY_KIND |
| |
| |
class DocsExtractor:
  """Extracts documentation for views/tables/functions from SQL.

  For each supported object kind the SQL text is scanned with the pattern
  registered in PATTERN_BY_KIND. For every match, the comment lines returned
  by extract_comment are split into a free-form description followed by
  '@'-prefixed annotations.
  """
  path: str
  module_name: str
  sql: str

  @dataclass
  class Annotation:
    """A single '@'-prefixed annotation taken from a documentation comment."""
    # Text of the annotation line up to (not including) its first space; this
    # still contains the leading '@'.
    key: str
    # Text after that first space, plus any continuation lines, each joined
    # with a single space. Empty when the annotation line has no space.
    value: str

  @dataclass
  class Extract:
    """Extracted documentation for a single view/table/function."""
    obj_kind: ObjKind
    obj_match: Match

    # Comment text preceding the first annotation, one '\n'-terminated entry
    # per comment line.
    description: str
    # Annotations in the order they appear in the comment.
    annotations: List['DocsExtractor.Annotation']

  def __init__(self, path: str, module_name: str, sql: str):
    """Stores the inputs and pre-splits the SQL text into lines.

    Args:
      path: Stored on the instance as-is; not read by this class.
      module_name: Stored on the instance as-is; not read by this class.
      sql: Full SQL text to extract documentation from.
    """
    self.path = path
    self.module_name = module_name
    self.sql = sql

    # Line-indexed view of the SQL, handed to extract_comment.
    self.sql_lines = sql.split("\n")
    # NOTE(review): no method of this class appends to this list; presumably
    # it is filled or read by callers - confirm.
    self.errors = []

  def extract(self) -> List[Extract]:
    """Returns the extracts for every supported object kind.

    Results are grouped by kind in the fixed order below, not interleaved by
    position in the SQL text.
    """
    kinds = (
        ObjKind.table_view,
        ObjKind.function,
        ObjKind.table_function,
        ObjKind.macro,
        ObjKind.include,
    )
    extracted = []
    for kind in kinds:
      extracted += self._extract_for_kind(kind)
    return extracted

  def _extract_for_kind(self, kind: ObjKind) -> List[Extract]:
    """Returns one extract per match of the pattern registered for |kind|.

    Matches are visited in ascending order of the line number they are keyed
    by in the match_pattern result.
    """
    line_number_to_matches = match_pattern(PATTERN_BY_KIND[kind], self.sql)
    extracts = []
    for line_number, match in sorted(line_number_to_matches.items()):
      comment_lines = extract_comment(self.sql_lines, line_number)
      e = self._extract_from_comment(kind, match, comment_lines)
      if e:
        extracts.append(e)
    return extracts

  def _extract_from_comment(self, kind: ObjKind, match: Match,
                            comment_lines: List[str]) -> Optional[Extract]:
    """Splits comment lines into a description and a list of annotations.

    Lines before the first annotation are appended to the description. A line
    whose text starts with '@' opens a new annotation, and any following
    non-annotation line is appended to the most recent annotation's value.

    Args:
      kind: Object kind recorded on the returned extract.
      match: Regex match recorded on the returned extract.
      comment_lines: Comment lines, each of which must start with '--'.

    Returns:
      The populated extract; an extract is returned even when
      |comment_lines| is empty.
    """
    extract = DocsExtractor.Extract(kind, match, '', [])
    for line in comment_lines:
      assert line.startswith('--')

      # lstrip treats its argument as a set of characters, so this removes
      # every leading '-' rather than only the two-character comment marker
      # (e.g. '--- x' becomes ' x').
      comment_stripped = line.lstrip('-')
      stripped = comment_stripped.lstrip()

      if stripped.startswith('@'):
        # This line is an annotation: find its name and add a new entry.
        # partition (rather than unpacking a split) keeps an annotation with
        # no trailing text, such as a bare '@tag', from raising ValueError;
        # its value is then the empty string.
        key, _, value = stripped.partition(' ')
        extract.annotations.append(DocsExtractor.Annotation(key, value))
      elif extract.annotations:
        # Continuation of the latest annotation.
        extract.annotations[-1].value += " " + stripped
      else:
        # No annotation seen yet, so this is still the description. The
        # whitespace after the comment marker is kept on purpose.
        extract.description += comment_stripped + "\n"
    return extract