wenzelm@34273
|
1 |
/* Title: Pure/Thy/thy_syntax.scala
|
wenzelm@34273
|
2 |
Author: Makarius
|
wenzelm@34273
|
3 |
|
wenzelm@38656
|
4 |
Superficial theory syntax: tokens and spans.
|
wenzelm@34273
|
5 |
*/
|
wenzelm@34273
|
6 |
|
wenzelm@34273
|
7 |
package isabelle
|
wenzelm@34273
|
8 |
|
wenzelm@34273
|
9 |
|
wenzelm@38495
|
10 |
import scala.collection.mutable
|
wenzelm@38656
|
11 |
import scala.annotation.tailrec
|
wenzelm@38495
|
12 |
|
wenzelm@38495
|
13 |
|
wenzelm@34308
|
14 |
object Thy_Syntax
|
wenzelm@34273
|
15 |
{
|
wenzelm@40711
|
16 |
/** nested structure **/
|
wenzelm@40711
|
17 |
|
wenzelm@40711
|
18 |
object Structure
{
  /* Entry of the nested outline; `length` is the total length of the commands it covers. */
  sealed abstract class Entry { def length: Int }

  /* Named group of entries; the length is summed once, when the block is constructed. */
  case class Block(name: String, body: List[Entry]) extends Entry
  {
    val length: Int = body.foldLeft(0)((sum, entry) => sum + entry.length)
  }

  /* Leaf entry wrapping a single command. */
  case class Atom(command: Command) extends Entry
  {
    def length: Int = command.length
  }

  /*
    Build the nested outline of `text`: the text is scanned with `syntax`,
    split into command spans, and every span becomes an Atom.  A command for
    which `syntax.heading_level` yields Some(i) first closes all open blocks
    of level >= i and then opens a new block named after its own source.
    The outermost block is "theory " + node_name.theory at level 0.
  */
  def parse(syntax: Outer_Syntax, node_name: Document.Node.Name, text: CharSequence): Entry =
  {
    /* stack of open blocks: (level, name, entries collected so far), innermost first */

    def fresh(): mutable.ListBuffer[Entry] = new mutable.ListBuffer[Entry]
    var open: List[(Int, String, mutable.ListBuffer[Entry])] =
      List((0, "theory " + node_name.theory, fresh()))

    // Fold the innermost block into its parent for as long as its level
    // satisfies `level`; the bottom element of the stack is never closed.
    @tailrec def close(level: Int => Boolean): Unit =
      open match {
        case (lev, name, entries) :: (outer @ ((_, _, parent) :: _)) if level(lev) =>
          parent += Block(name, entries.toList)
          open = outer
          close(level)
        case _ =>
      }

    // Close everything that is still open and wrap up the outermost block.
    def result(): Entry =
    {
      close(_ => true)
      open.head match {
        case (_, name, entries) => Block(name, entries.toList)
      }
    }

    // Register one command; a heading command is the first atom of the block it opens.
    def add(command: Command): Unit =
    {
      for (i <- syntax.heading_level(command)) {
        close(lev => lev >= i)
        open = (i, command.source, fresh()) :: open
      }
      open.head._3 += Atom(command)
    }


    /* result structure */

    for (span <- parse_spans(syntax.scan(text))) add(Command(node_name, span))
    result()
  }
}
|
wenzelm@40711
|
75 |
|
wenzelm@40711
|
76 |
|
wenzelm@40711
|
77 |
|
wenzelm@38656
|
78 |
/** parse spans **/
|
wenzelm@38656
|
79 |
|
wenzelm@38655
|
80 |
/*
  Split a token list into spans: every token with `is_command` starts a new
  span, all other tokens are appended to the current one.  Tokens before the
  first command token (if any) form a span of their own; no empty span is
  ever produced.
*/
def parse_spans(toks: List[Token]): List[List[Token]] =
{
  val finished = new mutable.ListBuffer[List[Token]]
  val pending = new mutable.ListBuffer[Token]

  // Emit the pending tokens as one span (if there are any) and start afresh.
  def flush(): Unit =
    if (pending.nonEmpty) {
      finished += pending.toList
      pending.clear()
    }

  toks.foreach { tok =>
    if (tok.is_command) flush()
    pending += tok
  }
  flush()
  finished.toList
}
|
wenzelm@38656
|
90 |
|
wenzelm@38656
|
91 |
|
wenzelm@38656
|
92 |
|
wenzelm@45324
|
93 |
/** perspective **/
|
wenzelm@45295
|
94 |
|
wenzelm@45295
|
95 |
/*
  Turn a text perspective into a command perspective: collect, in order, the
  commands of `node` (as enumerated by `node.command_range` over the overall
  perspective range) whose shifted range compares as 0 against one of the
  perspective ranges.  An empty text perspective yields the empty command
  perspective without touching the node.
*/
def command_perspective(node: Document.Node, perspective: Text.Perspective): Command.Perspective =
{
  if (perspective.is_empty) Command.Perspective.empty
  else {
    val visible = new mutable.ListBuffer[Command]

    // Walk both sequences in lock-step, advancing whichever side lies behind.
    @tailrec
    def walk(ranges: List[Text.Range], commands: Stream[(Command, Text.Offset)]): Unit =
      (ranges, commands) match {
        case (range :: more_ranges, (command, offset) #:: more_commands) =>
          range.compare(command.range + offset) match {
            // this range compares below the command: try the next range
            case -1 => walk(more_ranges, commands)
            // otherwise move on to the next command, recording a hit on 0
            case ord @ (0 | 1) =>
              if (ord == 0) visible += command
              walk(ranges, more_commands)
          }
        case _ =>
      }

    walk(perspective.ranges, node.command_range(perspective.range).toStream)
    Command.Perspective(visible.toList)
  }
}
|
wenzelm@45295
|
120 |
|
wenzelm@45506
|
121 |
/*
  Compute the command perspective of node `name` for `text_perspective`.
  The second component is None when the node's current perspective is the
  `same` as the new one, otherwise Some(nodes) with that node updated.
*/
def update_perspective(nodes: Document.Nodes,
    name: Document.Node.Name, text_perspective: Text.Perspective)
  : (Command.Perspective, Option[Document.Nodes]) =
{
  val old_node = nodes(name)
  val perspective = command_perspective(old_node, text_perspective)
  val unchanged = old_node.perspective.same(perspective)
  val updated_nodes =
    if (unchanged) None
    else Some(nodes + (name -> old_node.update_perspective(perspective)))
  (perspective, updated_nodes)
}
|
wenzelm@45324
|
132 |
|
wenzelm@45506
|
133 |
/*
  Apply a perspective change to `previous` and return the resulting command
  perspective together with a version made from the previous syntax and the
  updated nodes (or the previous nodes, if nothing changed).
*/
def edit_perspective(previous: Document.Version,
    name: Document.Node.Name, text_perspective: Text.Perspective)
  : (Command.Perspective, Document.Version) =
{
  val old_nodes = previous.nodes
  update_perspective(old_nodes, name, text_perspective) match {
    case (perspective, changed) =>
      (perspective, Document.Version.make(previous.syntax, changed.getOrElse(old_nodes)))
  }
}
|
wenzelm@45324
|
142 |
|
wenzelm@45295
|
143 |
|
wenzelm@45295
|
144 |
|
wenzelm@47820
|
145 |
/** header edits: structure and outer syntax **/
|
wenzelm@47820
|
146 |
|
wenzelm@47820
|
147 |
/*
  Process the header edits among `edits`.

  Result: (syntax, reparse, nodes, doc_edits) where
    - syntax is rebuilt from `base_syntax` plus the keywords of all nodes if
      the previous version `is_init` or some updated node changed its
      keywords; otherwise it is the previous syntax;
    - reparse is `nodes.descendants` of the nodes with updated headers when
      the syntax was rebuilt, and Nil otherwise;
    - nodes are the previous nodes with updated headers;
    - doc_edits are the header edits that were actually applied.
*/
private def header_edits(
  base_syntax: Outer_Syntax,
  previous: Document.Version,
  edits: List[Document.Edit_Text])
  : (Outer_Syntax, List[Document.Node.Name], Document.Nodes, List[Document.Edit_Command]) =
{
  var syntax_changed = previous.is_init
  var nodes = previous.nodes
  val doc_edits = new mutable.ListBuffer[Document.Edit_Command]

  edits.foreach {
    case (name, Document.Node.Header(header)) =>
      val old_node = nodes(name)
      // only two successful results with equal content count as "no change"
      val header_changed =
        (old_node.header, header) match {
          case (Exn.Res(old_deps), Exn.Res(new_deps)) => old_deps != new_deps
          case _ => true
        }
      if (header_changed) {
        val new_node = old_node.update_header(header)
        if (!syntax_changed) syntax_changed = old_node.keywords != new_node.keywords
        nodes += (name -> new_node)
        doc_edits += (name -> Document.Node.Header(header))
      }
    case _ =>
  }

  val syntax =
    if (!syntax_changed) previous.syntax
    else
      nodes.entries.foldLeft(base_syntax) {
        case (syn, (_, node)) => node.keywords.foldLeft(syn)(_ + _)
      }

  val reparse =
    if (syntax_changed) nodes.descendants(doc_edits.toList.map(_._1))
    else Nil

  (syntax, reparse, nodes, doc_edits.toList)
}
|
wenzelm@47820
|
185 |
|
wenzelm@47820
|
186 |
|
wenzelm@47820
|
187 |
|
wenzelm@38656
|
188 |
/** text edits **/
|
wenzelm@38656
|
189 |
|
wenzelm@47820
|
190 |
/* phase 1: edit individual command source */
|
wenzelm@47820
|
191 |
|
wenzelm@47820
|
192 |
/*
  Apply text edits one by one to the command sequence.  For each edit the
  first command is located that either `can_edit` it or ends exactly where
  an insertion starts:
    - an editable command is replaced by an unparsed command holding the
      edited text, and any remainder of the edit is processed next;
    - otherwise the inserted text becomes a new unparsed command right after
      the located command;
    - if no command is found, the edit must be an insertion at offset 0 and
      its text becomes the first command.
*/
@tailrec private def edit_text(eds: List[Text.Edit], commands: Linear_Set[Command])
    : Linear_Set[Command] =
{
  eds match {
    case Nil => commands

    case e :: es =>
      val target =
        Document.Node.command_starts(commands.iterator).find {
          case (cmd, cmd_start) =>
            e.can_edit(cmd.source, cmd_start) ||
              e.is_insert && e.start == cmd_start + cmd.length
        }
      target match {
        case Some((cmd, cmd_start)) =>
          if (e.can_edit(cmd.source, cmd_start)) {
            val (rest, text) = e.edit(cmd.source, cmd_start)
            val replaced = commands.insert_after(Some(cmd), Command.unparsed(text)) - cmd
            edit_text(rest.toList ::: es, replaced)
          }
          else edit_text(es, commands.insert_after(Some(cmd), Command.unparsed(e.text)))

        case None =>
          require(e.is_insert && e.start == 0)
          edit_text(es, commands.insert_after(None, Command.unparsed(e.text)))
      }
  }
}
|
wenzelm@47820
|
217 |
|
wenzelm@47820
|
218 |
|
wenzelm@47820
|
219 |
/* phase 2: recover command spans */
|
wenzelm@47820
|
220 |
|
wenzelm@47820
|
221 |
/*
  Repeatedly re-parse the neighbourhood of the first command that is not
  `is_defined`, until no such command is left.

  The neighbourhood runs from `first` to `last`: starting at the unparsed
  command and going backwards resp. forwards, commands with `newlines == 0`
  are skipped and the next one with `is_command` is taken (falling back to
  the head resp. last element of the sequence).  The joined source of that
  stretch is scanned and split into spans; boundary commands whose span is
  reproduced unchanged are kept, everything in between is replaced by fresh
  commands.
*/
@tailrec private def recover_spans(
  syntax: Outer_Syntax,
  node_name: Document.Node.Name,
  commands: Linear_Set[Command]): Linear_Set[Command] =
{
  commands.iterator.find(cmd => !cmd.is_defined) match {
    case None => commands

    case Some(first_unparsed) =>
      val first =
        commands.reverse_iterator(first_unparsed)
          .dropWhile(_.newlines == 0).find(_.is_command).getOrElse(commands.head)
      val last =
        commands.iterator(first_unparsed)
          .dropWhile(_.newlines == 0).find(_.is_command).getOrElse(commands.last)
      val affected =
        commands.iterator(first).takeWhile(_ != last).toList :+ last

      val spans0 = parse_spans(syntax.scan(affected.iterator.map(_.source).mkString))

      // keep `first` if it is a command whose span comes out unchanged
      val (before_edit, spans1) =
        if (spans0.nonEmpty && first.is_command && first.span == spans0.head)
          (Some(first), spans0.tail)
        else (commands.prev(first), spans0)

      // likewise for `last`
      val (after_edit, spans2) =
        if (spans1.nonEmpty && last.is_command && last.span == spans1.last)
          (Some(last), spans1.init)
        else (commands.next(last), spans1)

      val inserted = spans2.map(span => Command(Document.new_id(), node_name, span))
      val new_commands =
        commands.delete_between(before_edit, after_edit).append_after(before_edit, inserted)
      recover_spans(syntax, node_name, new_commands)
  }
}
|
wenzelm@47820
|
257 |
|
wenzelm@47820
|
258 |
|
wenzelm@47820
|
259 |
/* phase 3: full reparsing after syntax change */
|
wenzelm@47820
|
260 |
|
wenzelm@47820
|
261 |
/*
  Re-parse the complete source of a node with `syntax`.  If the resulting
  spans coincide with those of the existing commands, the original sequence
  is returned as it is; otherwise a new sequence of fresh commands is built.
*/
private def reparse_spans(
  syntax: Outer_Syntax,
  node_name: Document.Node.Name,
  commands: Linear_Set[Command]): Linear_Set[Command] =
{
  val old_commands = commands.toList
  val new_spans = parse_spans(syntax.scan(old_commands.map(_.source).mkString))
  if (old_commands.map(_.span) != new_spans) {
    val fresh = new_spans.map(span => Command(Document.new_id(), node_name, span))
    Linear_Set(fresh: _*)
  }
  else commands
}
|
wenzelm@47820
|
271 |
|
wenzelm@47820
|
272 |
|
wenzelm@47820
|
273 |
/* main phase */
|
wenzelm@47820
|
274 |
|
wenzelm@44604
|
275 |
/*
  Main entry point: turn text edits relative to `previous` into command edits
  and the resulting document version.

  Header edits are handled first by `header_edits`, which also determines the
  syntax and the nodes that need reparsing; the latter are processed as if
  they had received an empty list of text edits.  The remaining edits are
  then applied node by node.
*/
def text_edits(
    base_syntax: Outer_Syntax,
    previous: Document.Version,
    edits: List[Document.Edit_Text])
  : (List[Document.Edit_Command], Document.Version) =
{
  val (syntax, reparse, nodes0, doc_edits0) = header_edits(base_syntax, previous, edits)
  val reparse_set = reparse.toSet

  var nodes = nodes0
  val doc_edits = new mutable.ListBuffer[Document.Edit_Command]
  doc_edits ++= doc_edits0

  val all_edits = edits ::: reparse.map((_, Document.Node.Edits(Nil)))

  all_edits.foreach {
    case (name, Document.Node.Clear()) =>
      doc_edits += (name -> Document.Node.Clear())
      nodes += (name -> nodes(name).clear)

    case (name, Document.Node.Edits(text_edits)) =>
      val node = nodes(name)
      val old_commands = node.commands
      val edited = edit_text(text_edits, old_commands)
      val recovered = recover_spans(syntax, name, edited)  // FIXME somewhat slow
      val new_commands =
        if (reparse_set(name)) reparse_spans(syntax, name, recovered)  // slow
        else recovered

      val removed_commands = old_commands.iterator.filterNot(new_commands.contains(_)).toList
      val inserted_commands = new_commands.iterator.filterNot(old_commands.contains(_)).toList

      // removals come first (in reverse order), then insertions; each edit
      // is paired with the predecessor of the command in its own sequence
      val cmd_edits =
        removed_commands.reverse.map(cmd => (old_commands.prev(cmd), None)) :::
        inserted_commands.map(cmd => (new_commands.prev(cmd), Some(cmd)))

      doc_edits += (name -> Document.Node.Edits(cmd_edits))
      nodes += (name -> node.update_commands(new_commands))

    // header edits were already dealt with by header_edits
    case (_, Document.Node.Header(_)) =>

    case (name, Document.Node.Perspective(text_perspective)) =>
      update_perspective(nodes, name, text_perspective) match {
        case (perspective, Some(nodes1)) =>
          doc_edits += (name -> Document.Node.Perspective(perspective))
          nodes = nodes1
        case (_, None) =>
      }
  }

  (doc_edits.toList, Document.Version.make(syntax, nodes))
}
|
wenzelm@34273
|
323 |
}
|