src/Pure/General/url.scala
author nipkow
Tue, 05 Nov 2019 21:07:03 +0100
changeset 71044 cb504351d058
parent 69901 20b32ade0024
child 71163 b5822f4c3fde
permissions -rw-r--r--
tuned
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
56501
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
     1
/*  Title:      Pure/General/url.scala
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
     2
    Author:     Makarius
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
     3
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
     4
Basic URL operations.
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
     5
*/
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
     6
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
     7
package isabelle
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
     8
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
     9
64729
4eccd9bc5fd9 clarified file URI operations;
wenzelm
parents: 63645
diff changeset
    10
import java.io.{File => JFile}
65188
50cfc6775361 more complete exception handling;
wenzelm
parents: 65069
diff changeset
    11
import java.nio.file.{Paths, FileSystemNotFoundException}
67245
caa4c9001009 tuned signature;
wenzelm
parents: 66235
diff changeset
    12
import java.net.{URI, URISyntaxException, URL, MalformedURLException, URLDecoder, URLEncoder}
69901
20b32ade0024 clarified signature;
wenzelm
parents: 69394
diff changeset
    13
import java.util.Locale
63642
d83a1eeff9d2 more operations;
wenzelm
parents: 62248
diff changeset
    14
import java.util.zip.GZIPInputStream
56501
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
    15
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
    16
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
    17
object Url
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
    18
{
69901
20b32ade0024 clarified signature;
wenzelm
parents: 69394
diff changeset
    19
  /* special characters */
20b32ade0024 clarified signature;
wenzelm
parents: 69394
diff changeset
    20
20b32ade0024 clarified signature;
wenzelm
parents: 69394
diff changeset
    21
  def escape_special(c: Char): String =
20b32ade0024 clarified signature;
wenzelm
parents: 69394
diff changeset
    22
    if ("!#$&'()*+,/:;=?@[]".contains(c)) String.format(Locale.ROOT, "%%%02X", new Integer(c.toInt))
20b32ade0024 clarified signature;
wenzelm
parents: 69394
diff changeset
    23
    else c.toString
20b32ade0024 clarified signature;
wenzelm
parents: 69394
diff changeset
    24
20b32ade0024 clarified signature;
wenzelm
parents: 69394
diff changeset
    25
  def escape_special(s: String): String = s.iterator.map(escape_special(_)).mkString
20b32ade0024 clarified signature;
wenzelm
parents: 69394
diff changeset
    26
20b32ade0024 clarified signature;
wenzelm
parents: 69394
diff changeset
    27
  def escape_name(name: String): String =
20b32ade0024 clarified signature;
wenzelm
parents: 69394
diff changeset
    28
    name.iterator.map({ case '\'' => "%27" case c => c.toString }).mkString
20b32ade0024 clarified signature;
wenzelm
parents: 69394
diff changeset
    29
20b32ade0024 clarified signature;
wenzelm
parents: 69394
diff changeset
    30
20b32ade0024 clarified signature;
wenzelm
parents: 69394
diff changeset
    31
  /* make and check URLs */
62248
dca0bac351b2 allow single quote within URL;
wenzelm
parents: 56503
diff changeset
    32
56501
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
    33
  def apply(name: String): URL =
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
    34
  {
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
    35
    try { new URL(name) }
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
    36
    catch { case _: MalformedURLException => error("Malformed URL " + quote(name)) }
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
    37
  }
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
    38
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
    39
  def is_wellformed(name: String): Boolean =
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
    40
    try { Url(name); true }
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
    41
    catch { case ERROR(_) => false }
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
    42
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
    43
  def is_readable(name: String): Boolean =
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
    44
    try { Url(name).openStream.close; true }
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
    45
    catch { case ERROR(_) => false }
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
    46
63642
d83a1eeff9d2 more operations;
wenzelm
parents: 62248
diff changeset
    47
67245
caa4c9001009 tuned signature;
wenzelm
parents: 66235
diff changeset
    48
  /* strings */
caa4c9001009 tuned signature;
wenzelm
parents: 66235
diff changeset
    49
caa4c9001009 tuned signature;
wenzelm
parents: 66235
diff changeset
    50
  def decode(s: String): String = URLDecoder.decode(s, UTF8.charset_name)
caa4c9001009 tuned signature;
wenzelm
parents: 66235
diff changeset
    51
  def encode(s: String): String = URLEncoder.encode(s, UTF8.charset_name)
caa4c9001009 tuned signature;
wenzelm
parents: 66235
diff changeset
    52
caa4c9001009 tuned signature;
wenzelm
parents: 66235
diff changeset
    53
63642
d83a1eeff9d2 more operations;
wenzelm
parents: 62248
diff changeset
    54
  /* read */
d83a1eeff9d2 more operations;
wenzelm
parents: 62248
diff changeset
    55
63645
d7e0004d4321 more operations;
wenzelm
parents: 63642
diff changeset
    56
  private def read(url: URL, gzip: Boolean): String =
65069
wenzelm
parents: 64777
diff changeset
    57
    using(url.openStream)(stream =>
wenzelm
parents: 64777
diff changeset
    58
      File.read_stream(if (gzip) new GZIPInputStream(stream) else stream))
63642
d83a1eeff9d2 more operations;
wenzelm
parents: 62248
diff changeset
    59
63645
d7e0004d4321 more operations;
wenzelm
parents: 63642
diff changeset
    60
  def read(url: URL): String = read(url, false)
d7e0004d4321 more operations;
wenzelm
parents: 63642
diff changeset
    61
  def read_gzip(url: URL): String = read(url, true)
d7e0004d4321 more operations;
wenzelm
parents: 63642
diff changeset
    62
d7e0004d4321 more operations;
wenzelm
parents: 63642
diff changeset
    63
  def read(name: String): String = read(Url(name), false)
d7e0004d4321 more operations;
wenzelm
parents: 63642
diff changeset
    64
  def read_gzip(name: String): String = read(Url(name), true)
64729
4eccd9bc5fd9 clarified file URI operations;
wenzelm
parents: 63645
diff changeset
    65
69394
f3240f3aa698 more operations;
wenzelm
parents: 67245
diff changeset
    66
  def read_bytes(url: URL): Bytes =
f3240f3aa698 more operations;
wenzelm
parents: 67245
diff changeset
    67
  {
f3240f3aa698 more operations;
wenzelm
parents: 67245
diff changeset
    68
    val connection = url.openConnection
f3240f3aa698 more operations;
wenzelm
parents: 67245
diff changeset
    69
    val length = connection.getContentLength
f3240f3aa698 more operations;
wenzelm
parents: 67245
diff changeset
    70
    using(connection.getInputStream)(Bytes.read_stream(_, hint = length))
f3240f3aa698 more operations;
wenzelm
parents: 67245
diff changeset
    71
  }
f3240f3aa698 more operations;
wenzelm
parents: 67245
diff changeset
    72
64729
4eccd9bc5fd9 clarified file URI operations;
wenzelm
parents: 63645
diff changeset
    73
4eccd9bc5fd9 clarified file URI operations;
wenzelm
parents: 63645
diff changeset
    74
  /* file URIs */
4eccd9bc5fd9 clarified file URI operations;
wenzelm
parents: 63645
diff changeset
    75
66234
836898197296 clarified platform file operations;
wenzelm
parents: 65188
diff changeset
    76
  def print_file(file: JFile): String = File.absolute(file).toPath.toUri.toString
64777
ca09695eb43c clarified Document.Node.Name (again): canonical platform file;
wenzelm
parents: 64775
diff changeset
    77
  def print_file_name(name: String): String = print_file(new JFile(name))
64775
dd3797f1e0d6 clarified file URIs;
wenzelm
parents: 64766
diff changeset
    78
dd3797f1e0d6 clarified file URIs;
wenzelm
parents: 64766
diff changeset
    79
  def parse_file(uri: String): JFile = Paths.get(new URI(uri)).toFile
64729
4eccd9bc5fd9 clarified file URI operations;
wenzelm
parents: 63645
diff changeset
    80
4eccd9bc5fd9 clarified file URI operations;
wenzelm
parents: 63645
diff changeset
    81
  def is_wellformed_file(uri: String): Boolean =
64775
dd3797f1e0d6 clarified file URIs;
wenzelm
parents: 64766
diff changeset
    82
    try { parse_file(uri); true }
65188
50cfc6775361 more complete exception handling;
wenzelm
parents: 65069
diff changeset
    83
    catch {
50cfc6775361 more complete exception handling;
wenzelm
parents: 65069
diff changeset
    84
      case _: URISyntaxException | _: IllegalArgumentException | _: FileSystemNotFoundException =>
50cfc6775361 more complete exception handling;
wenzelm
parents: 65069
diff changeset
    85
        false
50cfc6775361 more complete exception handling;
wenzelm
parents: 65069
diff changeset
    86
    }
64730
76996d915894 clarified modules;
wenzelm
parents: 64729
diff changeset
    87
66235
d4fa51e7c4ff retain symlinks in file names from VSCode: relevant for proper file locations in decorations etc.;
wenzelm
parents: 66234
diff changeset
    88
  def absolute_file(uri: String): JFile = File.absolute(parse_file(uri))
d4fa51e7c4ff retain symlinks in file names from VSCode: relevant for proper file locations in decorations etc.;
wenzelm
parents: 66234
diff changeset
    89
  def absolute_file_name(uri: String): String = absolute_file(uri).getPath
d4fa51e7c4ff retain symlinks in file names from VSCode: relevant for proper file locations in decorations etc.;
wenzelm
parents: 66234
diff changeset
    90
66234
836898197296 clarified platform file operations;
wenzelm
parents: 65188
diff changeset
    91
  def canonical_file(uri: String): JFile = File.canonical(parse_file(uri))
64777
ca09695eb43c clarified Document.Node.Name (again): canonical platform file;
wenzelm
parents: 64775
diff changeset
    92
  def canonical_file_name(uri: String): String = canonical_file(uri).getPath
56501
5fda9e5c5874 basic URL operations (with Isabelle/Scala error handling);
wenzelm
parents:
diff changeset
    93
}