Draft conversion to DOM tree.
This commit is contained in:
parent
bd57dff091
commit
c08eb0a7cb
@ -1,2 +1,3 @@
|
|||||||
|
from . import dom
|
||||||
from .org_rw import *
|
from .org_rw import *
|
||||||
from .utils import *
|
from .utils import *
|
||||||
|
67
org_rw/dom.py
Normal file
67
org_rw/dom.py
Normal file
@ -0,0 +1,67 @@
|
|||||||
|
class PropertyDrawerNode:
|
||||||
|
def __init__(self):
|
||||||
|
self.children = []
|
||||||
|
|
||||||
|
def append(self, child):
|
||||||
|
self.children.append(child)
|
||||||
|
|
||||||
|
def __repr__(self):
|
||||||
|
return "<Properties: {}>".format(len(self.children))
|
||||||
|
|
||||||
|
|
||||||
|
class LogbookDrawerNode:
|
||||||
|
def __init__(self):
|
||||||
|
self.children = []
|
||||||
|
|
||||||
|
def append(self, child):
|
||||||
|
self.children.append(child)
|
||||||
|
|
||||||
|
def __repr__(self):
|
||||||
|
return "<Properties: {}>".format(len(self.children))
|
||||||
|
|
||||||
|
|
||||||
|
class PropertyNode:
|
||||||
|
def __init__(self, key, value):
|
||||||
|
self.key = key
|
||||||
|
self.value = value
|
||||||
|
|
||||||
|
def __repr__(self):
|
||||||
|
return "{{{}: {}}".format(self.key, self.value)
|
||||||
|
|
||||||
|
|
||||||
|
class ListGroupNode:
|
||||||
|
def __init__(self):
|
||||||
|
self.children = []
|
||||||
|
|
||||||
|
def append(self, child):
|
||||||
|
self.children.append(child)
|
||||||
|
|
||||||
|
def __repr__(self):
|
||||||
|
return "<List: {}>".format(len(self.children))
|
||||||
|
|
||||||
|
|
||||||
|
class Text:
|
||||||
|
def __init__(self, content):
|
||||||
|
self.content = content
|
||||||
|
|
||||||
|
|
||||||
|
class ListItem:
|
||||||
|
def __init__(self, content):
|
||||||
|
self.content = content
|
||||||
|
|
||||||
|
|
||||||
|
class BlockNode:
|
||||||
|
def append(self, child):
|
||||||
|
raise NotImplementedError()
|
||||||
|
|
||||||
|
|
||||||
|
class CodeBlock(BlockNode):
|
||||||
|
def __init__(self, header):
|
||||||
|
self.header = header
|
||||||
|
self.lines = []
|
||||||
|
|
||||||
|
def append(self, child):
|
||||||
|
self.lines.append(child)
|
||||||
|
|
||||||
|
def __repr__(self):
|
||||||
|
return "<Code: {}>".format(len(self.lines))
|
218
org_rw/org_rw.py
218
org_rw/org_rw.py
@ -10,6 +10,8 @@ from datetime import date, datetime, timedelta
|
|||||||
from enum import Enum
|
from enum import Enum
|
||||||
from typing import Generator, List, Tuple, Union
|
from typing import Generator, List, Tuple, Union
|
||||||
|
|
||||||
|
from . import dom
|
||||||
|
|
||||||
BASE_ENVIRONMENT = {
|
BASE_ENVIRONMENT = {
|
||||||
"org-footnote-section": "Footnotes",
|
"org-footnote-section": "Footnotes",
|
||||||
"org-options-keywords": (
|
"org-options-keywords": (
|
||||||
@ -93,6 +95,9 @@ END_SRC_RE = re.compile(r"^\s*#\+END_SRC\s*$", re.I)
|
|||||||
RESULTS_DRAWER_RE = re.compile(r"^\s*:results:\s*$", re.I)
|
RESULTS_DRAWER_RE = re.compile(r"^\s*:results:\s*$", re.I)
|
||||||
CodeSnippet = collections.namedtuple("CodeSnippet", ("name", "content", "result"))
|
CodeSnippet = collections.namedtuple("CodeSnippet", ("name", "content", "result"))
|
||||||
|
|
||||||
|
# Groupings
|
||||||
|
NON_FINISHED_GROUPS = (type(None), dom.ListGroupNode)
|
||||||
|
|
||||||
|
|
||||||
def get_tokens(value):
|
def get_tokens(value):
|
||||||
if isinstance(value, Text):
|
if isinstance(value, Text):
|
||||||
@ -169,6 +174,19 @@ def get_links_from_content(content):
|
|||||||
link_value.append(tok)
|
link_value.append(tok)
|
||||||
|
|
||||||
|
|
||||||
|
def get_line(item):
|
||||||
|
if isinstance(item, Text):
|
||||||
|
return item.linenum
|
||||||
|
elif isinstance(item, ListItem):
|
||||||
|
return item.linenum
|
||||||
|
elif isinstance(item, Property):
|
||||||
|
return item.linenum
|
||||||
|
elif isinstance(item, tuple):
|
||||||
|
return item[0]
|
||||||
|
else:
|
||||||
|
raise Exception("Unknown item type: {}".format(item))
|
||||||
|
|
||||||
|
|
||||||
class Headline:
|
class Headline:
|
||||||
def __init__(
|
def __init__(
|
||||||
self,
|
self,
|
||||||
@ -251,6 +269,86 @@ class Headline:
|
|||||||
# Remove from contents
|
# Remove from contents
|
||||||
self._remove_element_in_line(start_line + 1)
|
self._remove_element_in_line(start_line + 1)
|
||||||
|
|
||||||
|
def as_dom(self):
|
||||||
|
everything = (
|
||||||
|
self.keywords
|
||||||
|
+ self.contents
|
||||||
|
+ self.list_items
|
||||||
|
+ self.properties
|
||||||
|
+ self.structural
|
||||||
|
+ self.delimiters
|
||||||
|
)
|
||||||
|
|
||||||
|
tree = []
|
||||||
|
current_node = None
|
||||||
|
|
||||||
|
for line in sorted(everything, key=get_line):
|
||||||
|
# print("#-", current_node)
|
||||||
|
# print("=>", line)
|
||||||
|
if isinstance(line, Property):
|
||||||
|
assert isinstance(current_node, dom.PropertyDrawerNode)
|
||||||
|
current_node.append(dom.PropertyNode(line.key, line.value))
|
||||||
|
|
||||||
|
elif isinstance(line, Text):
|
||||||
|
if isinstance(current_node, dom.BlockNode):
|
||||||
|
current_node.append(dom.Text(line))
|
||||||
|
elif isinstance(current_node, dom.LogbookDrawerNode):
|
||||||
|
current_node.append(dom.Text(line))
|
||||||
|
else:
|
||||||
|
assert type(current_node) in NON_FINISHED_GROUPS
|
||||||
|
current_node = None
|
||||||
|
tree.append(dom.Text(line))
|
||||||
|
|
||||||
|
elif isinstance(line, ListItem):
|
||||||
|
if current_node is None:
|
||||||
|
current_node = dom.ListGroupNode()
|
||||||
|
tree.append(current_node)
|
||||||
|
assert isinstance(current_node, dom.ListGroupNode)
|
||||||
|
current_node.append(dom.ListItem(line))
|
||||||
|
|
||||||
|
elif (
|
||||||
|
isinstance(line, DelimiterLine)
|
||||||
|
and line.delimiter_type == DelimiterLineType.BEGIN_SRC
|
||||||
|
):
|
||||||
|
assert type(current_node) in NON_FINISHED_GROUPS
|
||||||
|
current_node = dom.CodeBlock(line)
|
||||||
|
current_node.append(current_node)
|
||||||
|
|
||||||
|
elif (
|
||||||
|
isinstance(line, DelimiterLine)
|
||||||
|
and line.delimiter_type == DelimiterLineType.END_SRC
|
||||||
|
):
|
||||||
|
assert isinstance(current_node, dom.BlockNode)
|
||||||
|
current_node = None
|
||||||
|
|
||||||
|
elif (
|
||||||
|
isinstance(line, tuple)
|
||||||
|
and len(line) == 2
|
||||||
|
and isinstance(line[0], int)
|
||||||
|
and isinstance(line[1], str)
|
||||||
|
):
|
||||||
|
# Structural
|
||||||
|
(linenum, content) = line
|
||||||
|
if content.strip().upper() == ":PROPERTIES:":
|
||||||
|
assert current_node is None
|
||||||
|
current_node = dom.PropertyDrawerNode()
|
||||||
|
tree.append(current_node)
|
||||||
|
elif content.strip().upper() == ":LOGBOOK:":
|
||||||
|
assert current_node is None
|
||||||
|
current_node = dom.LogbookDrawerNode()
|
||||||
|
tree.append(current_node)
|
||||||
|
elif content.strip().upper() == ":END:":
|
||||||
|
assert isinstance(
|
||||||
|
current_node, dom.PropertyDrawerNode
|
||||||
|
) or isinstance(current_node, dom.LogbookDrawerNode)
|
||||||
|
current_node = None
|
||||||
|
else:
|
||||||
|
raise Exception("Unknown structural line: {}".format(line))
|
||||||
|
else:
|
||||||
|
raise Exception("Unknown node type: {}".format(line))
|
||||||
|
|
||||||
|
return tree
|
||||||
|
|
||||||
def getLists(self):
|
def getLists(self):
|
||||||
lists = []
|
lists = []
|
||||||
last_line = None
|
last_line = None
|
||||||
@ -1281,6 +1379,61 @@ def parse_headline(hl, doc, parent) -> Headline:
|
|||||||
return headline
|
return headline
|
||||||
|
|
||||||
|
|
||||||
|
def dump_kw(kw):
|
||||||
|
options = kw.match.group("options")
|
||||||
|
if not options:
|
||||||
|
options = ""
|
||||||
|
|
||||||
|
return (
|
||||||
|
kw.linenum,
|
||||||
|
"{indentation}#+{key}{options}:{spacing}{value}".format(
|
||||||
|
indentation=kw.match.group("indentation"),
|
||||||
|
key=kw.key,
|
||||||
|
options=kw.options,
|
||||||
|
spacing=kw.match.group("spacing"),
|
||||||
|
value=kw.value,
|
||||||
|
),
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
|
def dump_property(prop: Property):
|
||||||
|
plus = ""
|
||||||
|
indentation = ""
|
||||||
|
spacing = " "
|
||||||
|
if prop.match is not None:
|
||||||
|
plus = prop.match.group("plus")
|
||||||
|
if plus is None:
|
||||||
|
plus = ""
|
||||||
|
indentation = prop.match.group("indentation")
|
||||||
|
spacing = prop.match.group("spacing")
|
||||||
|
|
||||||
|
if isinstance(prop.value, TimeRange):
|
||||||
|
value = timerange_to_string(prop.value)
|
||||||
|
elif isinstance(prop.value, OrgTime):
|
||||||
|
value = prop.value.to_raw()
|
||||||
|
else:
|
||||||
|
value = prop.value
|
||||||
|
|
||||||
|
return (
|
||||||
|
prop.linenum,
|
||||||
|
"{indentation}:{key}{plus}:{spacing}{value}".format(
|
||||||
|
indentation=indentation,
|
||||||
|
key=prop.key,
|
||||||
|
plus=plus,
|
||||||
|
spacing=spacing,
|
||||||
|
value=value,
|
||||||
|
),
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
|
def dump_structural(structural: Tuple):
|
||||||
|
return (structural[0], structural[1])
|
||||||
|
|
||||||
|
|
||||||
|
def dump_delimiters(line: DelimiterLine):
|
||||||
|
return (line.linenum, line.line)
|
||||||
|
|
||||||
|
|
||||||
class OrgDoc:
|
class OrgDoc:
|
||||||
def __init__(
|
def __init__(
|
||||||
self, headlines, keywords, contents, list_items, structural, properties
|
self, headlines, keywords, contents, list_items, structural, properties
|
||||||
@ -1350,57 +1503,6 @@ class OrgDoc:
|
|||||||
yield from headline.get_code_snippets()
|
yield from headline.get_code_snippets()
|
||||||
|
|
||||||
# Writing
|
# Writing
|
||||||
def dump_kw(self, kw):
|
|
||||||
options = kw.match.group("options")
|
|
||||||
if not options:
|
|
||||||
options = ""
|
|
||||||
|
|
||||||
return (
|
|
||||||
kw.linenum,
|
|
||||||
"{indentation}#+{key}{options}:{spacing}{value}".format(
|
|
||||||
indentation=kw.match.group("indentation"),
|
|
||||||
key=kw.key,
|
|
||||||
options=kw.options,
|
|
||||||
spacing=kw.match.group("spacing"),
|
|
||||||
value=kw.value,
|
|
||||||
),
|
|
||||||
)
|
|
||||||
|
|
||||||
def dump_property(self, prop: Property):
|
|
||||||
plus = ""
|
|
||||||
indentation = ""
|
|
||||||
spacing = " "
|
|
||||||
if prop.match is not None:
|
|
||||||
plus = prop.match.group("plus")
|
|
||||||
if plus is None:
|
|
||||||
plus = ""
|
|
||||||
indentation = prop.match.group("indentation")
|
|
||||||
spacing = prop.match.group("spacing")
|
|
||||||
|
|
||||||
if isinstance(prop.value, TimeRange):
|
|
||||||
value = timerange_to_string(prop.value)
|
|
||||||
elif isinstance(prop.value, OrgTime):
|
|
||||||
value = prop.value.to_raw()
|
|
||||||
else:
|
|
||||||
value = prop.value
|
|
||||||
|
|
||||||
return (
|
|
||||||
prop.linenum,
|
|
||||||
"{indentation}:{key}{plus}:{spacing}{value}".format(
|
|
||||||
indentation=indentation,
|
|
||||||
key=prop.key,
|
|
||||||
plus=plus,
|
|
||||||
spacing=spacing,
|
|
||||||
value=value,
|
|
||||||
),
|
|
||||||
)
|
|
||||||
|
|
||||||
def dump_structural(self, structural: Tuple):
|
|
||||||
return (structural[0], structural[1])
|
|
||||||
|
|
||||||
def dump_delimiters(self, line: DelimiterLine):
|
|
||||||
return (line.linenum, line.line)
|
|
||||||
|
|
||||||
def dump_headline(self, headline):
|
def dump_headline(self, headline):
|
||||||
|
|
||||||
tags = ""
|
tags = ""
|
||||||
@ -1423,7 +1525,7 @@ class OrgDoc:
|
|||||||
PROPERTIES_T = 2
|
PROPERTIES_T = 2
|
||||||
STRUCTURAL_T = 3
|
STRUCTURAL_T = 3
|
||||||
for keyword in headline.keywords:
|
for keyword in headline.keywords:
|
||||||
lines.append((KW_T, self.dump_kw(keyword)))
|
lines.append((KW_T, dump_kw(keyword)))
|
||||||
|
|
||||||
for content in headline.contents:
|
for content in headline.contents:
|
||||||
lines.append((CONTENT_T, dump_contents(content)))
|
lines.append((CONTENT_T, dump_contents(content)))
|
||||||
@ -1432,13 +1534,13 @@ class OrgDoc:
|
|||||||
lines.append((CONTENT_T, dump_contents(li)))
|
lines.append((CONTENT_T, dump_contents(li)))
|
||||||
|
|
||||||
for prop in headline.properties:
|
for prop in headline.properties:
|
||||||
lines.append((PROPERTIES_T, self.dump_property(prop)))
|
lines.append((PROPERTIES_T, dump_property(prop)))
|
||||||
|
|
||||||
for struct in headline.structural:
|
for struct in headline.structural:
|
||||||
lines.append((STRUCTURAL_T, self.dump_structural(struct)))
|
lines.append((STRUCTURAL_T, dump_structural(struct)))
|
||||||
|
|
||||||
for content in headline.delimiters:
|
for content in headline.delimiters:
|
||||||
lines.append((STRUCTURAL_T, self.dump_delimiters(content)))
|
lines.append((STRUCTURAL_T, dump_delimiters(content)))
|
||||||
|
|
||||||
lines = sorted(lines, key=lambda x: x[1][0])
|
lines = sorted(lines, key=lambda x: x[1][0])
|
||||||
|
|
||||||
@ -1500,13 +1602,13 @@ class OrgDoc:
|
|||||||
def dump(self):
|
def dump(self):
|
||||||
lines = []
|
lines = []
|
||||||
for prop in self.properties:
|
for prop in self.properties:
|
||||||
lines.append(self.dump_property(prop))
|
lines.append(dump_property(prop))
|
||||||
|
|
||||||
for struct in self.structural:
|
for struct in self.structural:
|
||||||
lines.append(self.dump_structural(struct))
|
lines.append(dump_structural(struct))
|
||||||
|
|
||||||
for kw in self.keywords:
|
for kw in self.keywords:
|
||||||
lines.append(self.dump_kw(kw))
|
lines.append(dump_kw(kw))
|
||||||
|
|
||||||
for line in self.contents:
|
for line in self.contents:
|
||||||
lines.append(dump_contents(line))
|
lines.append(dump_contents(line))
|
||||||
|
Loading…
Reference in New Issue
Block a user