src/Pure/System/standard_system.scala
author wenzelm
Wed, 14 Apr 2010 22:08:47 +0200
changeset 36144 89b1a136edef
parent 36039 6111de7c916a
child 36193 067a01827fca
permissions -rw-r--r--
more precise treatment of UNC server prefix, e.g. //foo;
wenzelm@34201
     1
/*  Title:      Pure/System/standard_system.scala
wenzelm@34201
     2
    Author:     Makarius
wenzelm@34201
     3
wenzelm@34201
     4
Standard system operations, with basic Cygwin/Posix compatibility.
wenzelm@34201
     5
*/
wenzelm@34201
     6
wenzelm@34201
     7
package isabelle
wenzelm@34201
     8
wenzelm@34201
     9
import java.util.regex.Pattern
wenzelm@34201
    10
import java.util.Locale
wenzelm@34201
    11
import java.io.{BufferedWriter, OutputStreamWriter, FileOutputStream,
wenzelm@34201
    12
  BufferedInputStream, FileInputStream, BufferedReader, InputStreamReader,
wenzelm@34298
    13
  File, FileFilter, IOException}
wenzelm@34201
    14
wenzelm@36035
    15
import scala.io.{Source, Codec}
wenzelm@34201
    16
import scala.util.matching.Regex
wenzelm@34201
    17
import scala.collection.mutable
wenzelm@34201
    18
wenzelm@34201
    19
wenzelm@34201
    20
object Standard_System
wenzelm@34201
    21
{
wenzelm@34201
    22
  // name of the character encoding used for file and process I/O
  val charset: String = "UTF-8"

  // scala.io codec corresponding to charset
  def codec(): Codec = Codec.apply(charset)
wenzelm@34201
    24
wenzelm@34201
    25
wenzelm@34201
    26
  /* permissive UTF-8 decoding */
wenzelm@34201
    27
wenzelm@34201
    28
  // see also http://en.wikipedia.org/wiki/UTF-8#Description
wenzelm@34201
    29
  // overlong encodings enable byte-stuffing
wenzelm@34201
    30
wenzelm@34201
    31
  // Decode text whose characters are UTF-8 code units (one unit per Char).
  // Overlong encodings are accepted; incomplete or invalid sequences are
  // replaced by U+FFFD; units matching none of the patterns below are skipped.
  def decode_permissive_utf8(text: CharSequence): String =
  {
    val result = new java.lang.StringBuilder(text.length)
    var code_point = -1   // code point under construction, -1 means none
    var pending = 0       // continuation units still expected

    // emit the code point under construction (if any) and reset the state
    def flush(): Unit =
      if (code_point != -1) {
        val complete = pending == 0 && Character.isValidCodePoint(code_point)
        if (complete) result.appendCodePoint(code_point)
        else result.append('\uFFFD')
        code_point = -1
        pending = 0
      }

    // start a new sequence with the given payload bits and continuation count
    def init(bits: Int, count: Int): Unit =
    {
      flush()
      code_point = bits
      pending = count
    }

    // add 6 payload bits of a continuation unit; an unexpected continuation
    // starts a sequence with count -1, which flush turns into U+FFFD
    def push(bits: Int): Unit =
      if (pending > 0) {
        code_point = (code_point << 6) + bits
        pending -= 1
      }
      else init(bits, -1)

    val length = text.length
    var index = 0
    while (index < length) {
      val c = text.charAt(index)
      c match {
        case _ if c < 128 => flush(); result.append(c)
        case _ if (c & 0xC0) == 0x80 => push(c & 0x3F)
        case _ if (c & 0xE0) == 0xC0 => init(c & 0x1F, 1)
        case _ if (c & 0xF0) == 0xE0 => init(c & 0x0F, 2)
        case _ if (c & 0xF8) == 0xF0 => init(c & 0x07, 3)
        case _ =>
      }
      index += 1
    }
    flush()
    result.toString
  }
wenzelm@34201
    72
wenzelm@34201
    73
wenzelm@34201
    74
  /* basic file operations */
wenzelm@34201
    75
wenzelm@34201
    76
  // Run body on a freshly created temporary file (name starts with prefix,
  // default suffix) and delete the file afterwards, even if body fails.
  def with_tmp_file[A](prefix: String)(body: File => A): A =
  {
    val tmp = File.createTempFile(prefix, null)
    try body(tmp)
    finally tmp.delete()
  }
wenzelm@34201
    81
wenzelm@34201
    82
  // Read the complete content of file as text, decoded according to charset.
  // The reader is closed in any case, also when reading fails.
  def read_file(file: File): String =
  {
    // file length in bytes serves as initial capacity of the buffer
    val buf = new StringBuilder(file.length.toInt)
    val reader = new BufferedReader(new InputStreamReader(new FileInputStream(file), charset))
    try {
      var c = reader.read
      while (c != -1) {
        buf.append(c.toChar)
        c = reader.read
      }
    }
    finally { reader.close }
    buf.toString
  }
wenzelm@34201
    94
wenzelm@34201
    95
  // Write text to file, encoded according to charset; existing content is
  // replaced.  The writer is closed in any case.
  def write_file(file: File, text: CharSequence): Unit =
  {
    val stream = new FileOutputStream(file)
    val writer = new BufferedWriter(new OutputStreamWriter(stream, charset))
    try writer.append(text)
    finally writer.close()
  }
wenzelm@34201
   101
wenzelm@34300
   102
  // FIXME handle (potentially cyclic) directory graph
wenzelm@34298
   103
  // Collect start and all entries reachable below it (depth-first) that
  // satisfy ok.  Directories are always descended into, whether or not they
  // satisfy ok themselves.
  def find_files(start: File, ok: File => Boolean): List[File] =
  {
    val files = new mutable.ListBuffer[File]
    val filter = new FileFilter { def accept(entry: File) = entry.isDirectory || ok(entry) }
    def find_entry(entry: File)
    {
      if (ok(entry)) files += entry
      if (entry.isDirectory) {
        // listFiles yields null (not an empty array) if the directory cannot
        // be read, e.g. due to missing permissions or an I/O error
        val entries = entry.listFiles(filter)
        if (entries != null) entries.foreach(find_entry)
      }
    }
    find_entry(start)
    files.toList
  }
wenzelm@34298
   115
wenzelm@34201
   116
wenzelm@34201
   117
  /* shell processes */
wenzelm@34201
   118
wenzelm@34222
   119
  // Start an external process for the command line args.
  //   cwd: working directory, null keeps the default of ProcessBuilder
  //   env: complete replacement of the process environment, null keeps the default
  //   redirect: merge stderr into stdout
  // An IOException on startup is turned into error with the same message.
  def raw_execute(cwd: File, env: Map[String, String], redirect: Boolean, args: String*): Process =
  {
    val command = new java.util.LinkedList[String]
    args.foreach(arg => command.add(arg))

    val builder = new ProcessBuilder(command)
    if (cwd != null) builder.directory(cwd)
    if (env != null) {
      val target = builder.environment
      target.clear()
      env.foreach { case (name, value) => target.put(name, value) }
    }
    builder.redirectErrorStream(redirect)

    try builder.start()
    catch { case exn: IOException => error(exn.getMessage) }
  }
wenzelm@34201
   135
wenzelm@34201
   136
  // Close stdin of proc, read its complete stdout (decoded via codec()), and
  // wait for termination.  Result is the output together with the return code.
  // Streams are closed and the process is destroyed in any case, also when
  // closing stdin, reading the output or waiting fails.
  def process_output(proc: Process): (String, Int) =
  {
    try {
      proc.getOutputStream.close
      val output = Source.fromInputStream(proc.getInputStream)(codec()).mkString  // FIXME
      val rc = proc.waitFor
      (output, rc)
    }
    finally {
      proc.getInputStream.close
      proc.getErrorStream.close
      proc.destroy
      // reset the interrupt status of the current thread
      Thread.interrupted
    }
  }
wenzelm@34258
   150
wenzelm@34258
   151
  // Start a process via raw_execute and collect its output and return code
  // via process_output.
  def raw_exec(cwd: File, env: Map[String, String], redirect: Boolean, args: String*):
    (String, Int) =
  {
    val proc = raw_execute(cwd, env, redirect, args: _*)
    process_output(proc)
  }
wenzelm@34201
   153
}
wenzelm@34201
   154
wenzelm@34201
   155
wenzelm@34201
   156
class Standard_System
{
  // root of the platform file-system: result of Cygwin.check_root() on
  // Windows, "/" otherwise
  val platform_root = if (Platform.is_windows) Cygwin.check_root() else "/"
  override def toString = platform_root


  /* jvm_path */

  // "/cygdrive/X", followed by end of input or by "/..."
  private val Cygdrive = new Regex("/cygdrive/([a-zA-Z])($|/.*)")
  // two or more slashes, then a name without slashes (e.g. //foo), then the rest
  private val Named_Root = new Regex("//+([^/]*)(.*)")

  // Convert a POSIX path to the notation of the JVM platform; the identity
  // function unless running on Windows.
  def jvm_path(posix_path: String): String =
    if (!Platform.is_windows) posix_path
    else {
      val jvm = new StringBuilder

      // emit the root part and determine the remaining POSIX path
      val remainder =
        posix_path match {
          case Cygdrive(drive, tail) =>
            jvm ++= drive
            jvm ++= ":"
            jvm ++= File.separator
            tail
          case Named_Root(root, tail) =>
            jvm ++= File.separator
            jvm ++= File.separator
            jvm ++= root
            tail
          case absolute if absolute.startsWith("/") =>
            jvm ++= platform_root
            absolute
          case relative => relative
        }

      // append non-empty path elements, delimited by the platform separator
      val elems = remainder.split("/").filter(elem => elem != "")
      elems.foreach { elem =>
        val last = jvm.length - 1
        if (last >= 0 && jvm(last) != File.separatorChar) jvm += File.separatorChar
        jvm ++= elem
      }
      jvm.toString
    }


  /* posix_path */

  // platform_root (case-insensitive), followed by backslashes or end of input
  private val Platform_Root = new Regex("(?i)" +
    Pattern.quote(platform_root) + """(?:\\+|\z)(.*)""")

  // drive letter with colon, followed by optional backslashes
  private val Drive = new Regex("""([a-zA-Z]):\\*(.*)""")

  // Convert a JVM platform path to POSIX notation; the identity function
  // unless running on Windows.
  def posix_path(jvm_path: String): String =
    if (!Platform.is_windows) jvm_path
    else {
      def slashes(s: String): String = s.replace('\\', '/')

      // match against uniform backslash notation
      val normalized = jvm_path.replace('/', '\\')
      normalized match {
        case Platform_Root(rest) => "/" + slashes(rest)
        case Drive(letter, rest) =>
          val drive = "/cygdrive/" + letter.toLowerCase(Locale.ENGLISH)
          if (rest == "") drive else drive + "/" + slashes(rest)
        case other => slashes(other)
      }
    }
}