Merge: Added contributing guidelines and link from readme
[nit.git] / lib / core / file.nit
1 # This file is part of NIT ( http://www.nitlanguage.org ).
2 #
3 # Copyright 2004-2008 Jean Privat <jean@pryen.org>
4 # Copyright 2008 Floréal Morandat <morandat@lirmm.fr>
5 # Copyright 2008 Jean-Sébastien Gélinas <calestar@gmail.com>
6 #
7 # This file is free software, which comes along with NIT. This software is
8 # distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY;
9 # without even the implied warranty of MERCHANTABILITY or FITNESS FOR A
10 # PARTICULAR PURPOSE. You can modify it is you want, provided this header
11 # is kept unaltered, and a notification of the changes is added.
12 # You are allowed to redistribute it and sell it, alone or is a part of
13 # another product.
14
15 # File manipulations (create, read, write, etc.)
16 module file
17
18 intrude import stream
19 intrude import text::ropes
20 import text
21 import time
22 import gc
23
24 in "C Header" `{
25 #include <dirent.h>
26 #include <string.h>
27 #include <sys/types.h>
28 #include <sys/stat.h>
29 #include <unistd.h>
30 #include <stdio.h>
31 #include <poll.h>
32 #include <errno.h>
33 `}
34
# Common base of the streams backed by a File or a FileDescriptor
abstract class FileStream
	super Stream

	# Path of the underlying file.
	var path: nullable String = null

	# The underlying C `FILE *`; reset to `null` by a successful `close`.
	private var file: nullable NativeFile = null

	# Status of the underlying file, see POSIX stat(2).
	#
	#     var f = new FileReader.open("/etc/issue")
	#     assert f.file_stat.is_file
	#
	# Return `null` in case of error.
	fun file_stat: nullable FileStat
	do
		var native_stat = _file.as(not null).file_stat
		if not native_stat.address_is_null then return new FileStat(native_stat)
		return null
	end

	# File descriptor of this file
	fun fd: Int
	do
		var native = _file.as(not null)
		return native.fileno
	end

	redef fun close
	do
		var native = _file
		# Already closed: nothing to do.
		if native == null then return

		if not native.address_is_null then
			if native.io_close != 0 then
				last_error = new IOError("Close failed due to error {sys.errno.strerror}")
			end
			_file = null
			return
		end

		# The stream was never successfully opened.
		# Keep the error that was already recorded, if there is one.
		if last_error == null then
			last_error = new IOError("Cannot close unopened file")
		end
	end

	# Change the buffering mode of this stream.
	#
	# A `buf_size` that is <= 0 is replaced by the default value of 512.
	#
	# `mode` is one of the buffer_mode enumeration in `Sys`:
	#
	# * `buffer_mode_full`
	# * `buffer_mode_line`
	# * `buffer_mode_none`
	#
	# On failure, `last_error` is set.
	fun set_buffering_mode(buf_size, mode: Int)
	do
		var size = buf_size
		if size <= 0 then size = 512
		var status = _file.as(not null).set_buffering_type(size, mode)
		if status == 0 then return
		last_error = new IOError("Error while changing buffering type for FileStream, returned error {sys.errno.strerror}")
	end
end
92
# `Stream` that can read from a File
class FileReader
	super FileStream
	super BufferedReader
	super PollableReader
	# Misc

	# Open the same file again.
	# The original path is reused, therefore the reopened file can be a different file.
	#
	#     var f = new FileReader.open("/etc/issue")
	#     var l = f.read_line
	#     f.reopen
	#     assert l == f.read_line
	#
	# In case of error, `last_error` is set and `end_reached` is true.
	fun reopen
	do
		# Release the previous handle whenever there is a valid one,
		# including when the end of the file was already reached;
		# otherwise the old `FILE *` would be overwritten without being closed.
		var old = _file
		if old != null and not old.address_is_null then close
		last_error = null
		_file = new NativeFile.io_open_read(path.as(not null).to_cstring)
		if _file.as(not null).address_is_null then
			last_error = new IOError("Cannot open `{path.as(not null)}`: {sys.errno.strerror}")
			end_reached = true
			return
		end
		end_reached = false
		buffer_reset
	end

	# Close the file, drop the buffered data and mark the end as reached.
	redef fun close
	do
		super
		buffer_reset
		end_reached = true
	end

	# Refill the buffer with the next bytes of the file.
	#
	# A read error is recorded in `last_error` (unless an error is already set).
	# `end_reached` becomes true on error or when nothing could be read.
	redef fun fill_buffer
	do
		var nb = _file.as(not null).io_read(_buffer, _buffer_capacity)
		if last_error == null and _file.as(not null).ferror then
			last_error = new IOError("Cannot read `{path.as(not null)}`: {sys.errno.strerror}")
			end_reached = true
		end
		if nb <= 0 then
			end_reached = true
			# Never expose a negative length to the buffer logic.
			nb = 0
		end
		_buffer_length = nb
		_buffer_pos = 0
	end

	# End of file?
	redef var end_reached = false

	# Open the file at `path` for reading.
	#
	#     var f = new FileReader.open("/etc/issue")
	#     assert not f.end_reached
	#     f.close
	#
	# In case of error, `last_error` is set
	#
	#     f = new FileReader.open("/fail/does not/exist")
	#     assert f.end_reached
	#     assert f.last_error != null
	init open(path: String)
	do
		self.path = path
		prepare_buffer(100)
		_file = new NativeFile.io_open_read(path.to_cstring)
		if _file.as(not null).address_is_null then
			last_error = new IOError("Cannot open `{path}`: {sys.errno.strerror}")
			end_reached = true
		end
	end

	# Creates a new File stream from a file descriptor
	#
	# This is a low-level method.
	#
	# In case of error, `last_error` is set and `end_reached` is true.
	init from_fd(fd: Int) do
		self.path = ""
		prepare_buffer(1)
		_file = fd.fd_to_stream(read_only)
		if _file.as(not null).address_is_null then
			last_error = new IOError("Error: Converting fd {fd} to stream failed with '{sys.errno.strerror}'")
			end_reached = true
		end
	end

	# Is there something to read right now?
	#
	# Return false and set `last_error` if the polling itself failed.
	redef fun poll_in
	do
		var res = native_poll_in(fd)
		if res == -1 then
			# Report a readable message, like the other errors of this class.
			last_error = new IOError("Error: Polling failed with '{sys.errno.strerror}'")
			return false
		else return res > 0
	end

	# Result of a non-blocking `poll(2)` for `POLLIN` on `fd` (timeout of 0).
	private fun native_poll_in(fd: Int): Int `{
		struct pollfd fds = {(int)fd, POLLIN, 0};
		return poll(&fds, 1, 0);
	`}
end
195
# `Stream` that can write to a File
class FileWriter
	super FileStream
	super Writer

	redef fun write_bytes(s)
	do
		if last_error != null then return
		if _is_writable then
			write_native(s.items, 0, s.length)
		else
			last_error = new IOError("cannot write to non-writable stream")
		end
	end

	redef fun write(s)
	do
		if last_error != null then return
		if _is_writable then
			s.write_native_to(self)
		else
			last_error = new IOError("cannot write to non-writable stream")
		end
	end

	redef fun write_byte(value)
	do
		if last_error != null then return
		if not _is_writable then
			last_error = new IOError("Cannot write to non-writable stream")
			return
		end
		var native = _file.as(not null)
		if native.address_is_null then
			last_error = new IOError("Writing on a null stream")
			_is_writable = false
			return
		end

		var written = native.write_byte(value)
		# Anything other than exactly one written byte is reported as an error.
		if written != 1 then
			last_error = new IOError("Problem writing a byte: {written}")
		end
	end

	# Close the file; the stream is no longer writable afterwards.
	redef fun close
	do
		super
		_is_writable = false
	end

	redef var is_writable = false

	# Write `len` bytes of `native`, starting at the offset `from`.
	#
	# Nothing is written if an error is already set or if the stream is not writable.
	private fun write_native(native: NativeString, from, len: Int)
	do
		if last_error != null then return
		if not _is_writable then
			last_error = new IOError("Cannot write to non-writable stream")
			return
		end
		var out = _file.as(not null)
		if out.address_is_null then
			last_error = new IOError("Writing on a null stream")
			_is_writable = false
			return
		end
		var written = out.io_write(native, from, len)
		# A short write is reported as an error.
		if written != len then
			last_error = new IOError("Problem in writing : {written} {len} \n")
		end
	end

	# Open the file at `path` for writing.
	#
	# In case of error, `last_error` is set and the stream is not writable.
	init open(path: String)
	do
		var native = new NativeFile.io_open_write(path.to_cstring)
		_file = native
		self.path = path
		_is_writable = true
		if native.address_is_null then
			last_error = new IOError("Cannot open `{path}`: {sys.errno.strerror}")
			is_writable = false
		end
	end

	# Creates a new File stream from a file descriptor
	#
	# In case of error, `last_error` is set and the stream is not writable.
	init from_fd(fd: Int)
	do
		self.path = ""
		var native = fd.fd_to_stream(wipe_write)
		_file = native
		_is_writable = true
		if native.address_is_null then
			last_error = new IOError("Error: Opening stream from file descriptor {fd} failed with '{sys.errno.strerror}'")
			_is_writable = false
		end
	end
end
290
redef class Int
	# Wrap the file descriptor `self` into a C stream opened with the file access `mode`.
	#
	# NOTE: The `mode` specified must be compatible with the one used in the file descriptor.
	private fun fd_to_stream(mode: NativeString): NativeFile `{
		FILE *stream = fdopen((int)self, mode);
		return stream;
	`}
end
299
# Access mode (`"r"`) of the read-only file streams
private fun read_only: NativeString
do
	return once "r".to_cstring
end
302
# Access mode (`"w"`) of the write-only file streams
#
# A stream opened on a file with this mode wipes the previous
# content of the file, if any. If there is no such file, it is created.
private fun wipe_write: NativeString
do
	return once "w".to_cstring
end
309
310 ###############################################################################
311
# Standard input stream.
#
# The class of the default value of `sys.stdin`.
class Stdin
	super FileReader

	# Bind the reader to the native standard input, with a buffer prepared with a capacity of 1.
	init
	do
		path = "/dev/stdin"
		_file = new NativeFile.native_stdin
		prepare_buffer(1)
	end
end
324
# Standard output stream.
#
# The class of the default value of `sys.stdout`.
class Stdout
	super FileWriter

	# Bind the writer to the native standard output and request line buffering.
	init
	do
		path = "/dev/stdout"
		_is_writable = true
		_file = new NativeFile.native_stdout
		# Must come last: it works on the `_file` that was just set.
		set_buffering_mode(256, sys.buffer_mode_line)
	end
end
337
# Standard error stream.
#
# The class of the default value of `sys.stderr`.
class Stderr
	super FileWriter

	# Bind the writer to the native standard error.
	init
	do
		path = "/dev/stderr"
		_is_writable = true
		_file = new NativeFile.native_stderr
	end
end
349
350 ###############################################################################
351
redef class Writable
	# Like `write_to`, but opens a `FileWriter` on `filepath` itself and closes it afterwards.
	fun write_to_file(filepath: String)
	do
		var out = new FileWriter.open(filepath)
		write_to(out)
		out.close
	end
end
361
# Utility class to access file system services.
#
# Usually created with `Text::to_path`.
#
# `Path` objects do not necessarily represent existing files in a file system.
# They are stateless objects that efficiently represent path information.
# They also provide an easy to use API on file-system services and are used to store their error status (see `last_error`)
class Path

	private var path: String

	# Path to this file
	redef fun to_s do return path

	# Short name of the file at `to_s`
	#
	# ~~~
	# var path = "/tmp/somefile".to_path
	# assert path.filename == "somefile"
	# ~~~
	#
	# The result does not depend on the file system, thus is cached for efficiency.
	var filename: String = path.basename is lazy

	# The path simplified by removing useless `.`, removing `//`, and resolving `..`
	#
	# ~~~
	# var path = "somedir/./tmp/../somefile".to_path
	# assert path.simplified.to_s == "somedir/somefile"
	# ~~~
	#
	# See `String::simplify_path` for details.
	#
	# The result does not depend on the file system, thus is cached for efficiency.
	var simplified: Path is lazy do
		var res = path.simplify_path.to_path
		# The result is already simplified: pre-fill its own cache with itself.
		res.simplified = res
		return res
	end

	# Return the directory part of the path.
	#
	# ~~~
	# var path = "/foo/bar/baz".to_path
	# assert path.dir.to_s == "/foo/bar"
	# assert path.dir.dir.to_s == "/foo"
	# assert path.dir.dir.dir.to_s == "/"
	# ~~~
	#
	# See `String::dirname` for details.
	#
	# The result does not depend on the file system, thus is cached for efficiency.
	var dir: Path is lazy do
		return path.dirname.to_path
	end

	# Last error produced by I/O operations.
	#
	# ~~~
	# var path = "/does/not/exists".to_path
	# assert path.last_error == null
	# path.read_all
	# assert path.last_error != null
	# ~~~
	#
	# Since `Path` objects are stateless, `last_error` is reset on most operations and reflects their status.
	var last_error: nullable IOError = null is writable

	# Does the file at `path` exist?
	#
	# If the file does not exist, `last_error` is set to the information.
	fun exists: Bool do return stat != null

	# Information on the file at `self` following symbolic links
	#
	# Returns `null` if there is no file at `self`.
	# `last_error` is updated to contain the error information on error, and null on success.
	#
	#     assert "/etc/".to_path.stat.is_dir
	#     assert "/etc/issue".to_path.stat.is_file
	#     assert "/fail/does not/exist".to_path.stat == null
	#
	# ~~~
	# var p = "/tmp/".to_path
	# var stat = p.stat
	# if stat != null then # Does `p` exist?
	#     print "It's size is {stat.size}"
	#     if stat.is_dir then print "It's a directory"
	# else
	#     print p.last_error.to_s
	# end
	# ~~~
	fun stat: nullable FileStat
	do
		var stat = path.to_cstring.file_stat
		if stat.address_is_null then
			last_error = new IOError("Cannot open `{path}`: {sys.errno.strerror}")
			return null
		end
		last_error = null
		return new FileStat(stat)
	end

	# Information on the file or link at `self`
	#
	# Do not follow symbolic links.
	#
	# Returns `null` on error.
	# `last_error` is updated to contain the error information on error, and null on success.
	fun link_stat: nullable FileStat
	do
		var stat = path.to_cstring.file_lstat
		if stat.address_is_null then
			last_error = new IOError("Cannot open `{path}`: {sys.errno.strerror}")
			return null
		end
		last_error = null
		return new FileStat(stat)
	end

	# Delete a file from the file system.
	#
	# `last_error` is updated to contain the error information on error, and null on success.
	fun delete
	do
		var res = path.to_cstring.file_delete
		if not res then
			last_error = new IOError("Cannot delete `{path}`: {sys.errno.strerror}")
		else
			last_error = null
		end
	end

	# Copy content of file at `path` to `dest`.
	#
	# `last_error` is updated to contain the error information on error, and null on success.
	#
	# If the file at `path` cannot be opened for reading, `dest` is not opened at all.
	fun copy(dest: Path)
	do
		last_error = null
		var input = open_ro
		if input.last_error != null then
			# `open_ro` has already stored the error in `last_error`.
			# Stop before `dest.open_wo`, which opens `dest` for writing
			# (presumably creating or truncating it -- the native open is
			# not visible from here) although there is nothing to copy.
			input.close
			return
		end
		var output = dest.open_wo

		while not input.eof do
			var buffer = input.read_bytes(1024)
			output.write_bytes buffer
		end

		input.close
		output.close
		# A read error takes precedence over a write error.
		last_error = input.last_error or else output.last_error
	end

	# Open this file for reading.
	#
	# ~~~
	# var file = "/etc/issue".to_path.open_ro
	# print file.read_line
	# file.close
	# ~~~
	#
	# Note that it is the user's responsibility to close the stream.
	# Therefore, for simple use case, look at `read_all` or `each_line`.
	#
	# ENSURE `last_error == result.last_error`
	fun open_ro: FileReader
	do
		var res = new FileReader.open(path)
		last_error = res.last_error
		return res
	end

	# Open this file for writing
	#
	# ~~~
	# var file = "bla.log".to_path.open_wo
	# file.write "Blabla\n"
	# file.close
	# ~~~
	#
	# Note that it is the user's responsibility to close the stream.
	# Therefore, for simple use case, look at `Writable::write_to_file`.
	#
	# ENSURE `last_error == result.last_error`
	fun open_wo: FileWriter
	do
		var res = new FileWriter.open(path)
		last_error = res.last_error
		return res
	end

	# Read all the content of the file as a string.
	#
	# ~~~
	# var content = "/etc/issue".to_path.read_all
	# print content
	# ~~~
	#
	# `last_error` is updated to contain the error information on error, and null on success.
	# In case of error, the result might be empty or truncated.
	#
	# See `Reader::read_all` for details.
	fun read_all: String do return read_all_bytes.to_s

	# Read all the content on the file as a raw sequence of bytes.
	#
	# ~~~
	# var content = "/etc/issue".to_path.read_all_bytes
	# print content.to_s
	# ~~~
	#
	# `last_error` is updated to contain the error information on error, and null on success.
	# In case of error, the result might be empty or truncated.
	fun read_all_bytes: Bytes
	do
		var s = open_ro
		var res = s.read_all_bytes
		s.close
		last_error = s.last_error
		return res
	end

	# Read all the lines of the file
	#
	# ~~~
	# var lines = "/etc/passwd".to_path.read_lines
	#
	# print "{lines.length} users"
	#
	# for l in lines do
	#     var fields = l.split(":")
	#     print "name={fields[0]} uid={fields[2]}"
	# end
	# ~~~
	#
	# `last_error` is updated to contain the error information on error, and null on success.
	# In case of error, the result might be empty or truncated.
	#
	# See `Reader::read_lines` for details.
	fun read_lines: Array[String]
	do
		var s = open_ro
		var res = s.read_lines
		s.close
		last_error = s.last_error
		return res
	end

	# Return an iterator on each line of the file
	#
	# ~~~
	# for l in "/etc/passwd".to_path.each_line do
	#     var fields = l.split(":")
	#     print "name={fields[0]} uid={fields[2]}"
	# end
	# ~~~
	#
	# Note: the stream is automatically closed at the end of the file (see `LineIterator::close_on_finish`)
	#
	# `last_error` is updated to contain the error information on error, and null on success.
	#
	# See `Reader::each_line` for details.
	fun each_line: LineIterator
	do
		var s = open_ro
		var res = s.each_line
		res.close_on_finish = true
		last_error = s.last_error
		return res
	end


	# Lists the files contained within the directory at `path`.
	#
	#     var files = "/etc".to_path.files
	#     assert files.has("/etc/issue".to_path)
	#
	# `last_error` is updated to contain the error information on error, and null on success.
	# In case of error, the result might be empty or truncated.
	#
	#     var path = "/etc/issue".to_path
	#     files = path.files
	#     assert files.is_empty
	#     assert path.last_error != null
	fun files: Array[Path]
	do
		last_error = null
		var res = new Array[Path]
		var d = new NativeDir.opendir(path.to_cstring)
		if d.address_is_null then
			last_error = new IOError("Cannot list directory `{path}`: {sys.errno.strerror}")
			return res
		end

		loop
			var de = d.readdir
			if de.address_is_null then
				# readdir cannot fail, so null means end of list
				break
			end
			var name = de.to_s_with_copy
			# The special entries are not part of the content of the directory.
			if name == "." or name == ".." then continue
			res.add new Path(path / name)
		end
		d.closedir

		return res
	end

	# Is `self` the path to an existing directory ?
	#
	# ~~~nit
	# assert ".".to_path.is_dir
	# assert not "/etc/issue".to_path.is_dir
	# assert not "/should/not/exist".to_path.is_dir
	# ~~~
	fun is_dir: Bool do
		var st = stat
		if st == null then return false
		return st.is_dir
	end

	# Delete a directory and all of its content
	#
	# Does not go through symbolic links and may get stuck in a cycle if there
	# is a cycle in the file system.
	#
	# `last_error` is updated to contain the error information on error, and null on success.
	# The method does not stop on the first error and tries to remove most files and directories.
	#
	# ~~~
	# var path = "/does/not/exists/".to_path
	# path.rmdir
	# assert path.last_error != null
	# ~~~
	fun rmdir
	do
		last_error = null
		for file in self.files do
			# `link_stat` so that a symbolic link is deleted, not followed.
			var stat = file.link_stat
			if stat == null then
				last_error = file.last_error
				continue
			end
			if stat.is_dir then
				# Recursively rmdir
				file.rmdir
			else
				file.delete
			end
			# Keep the first error, but continue with the other entries.
			if last_error == null then last_error = file.last_error
		end

		# Delete the directory itself if things are fine
		if last_error == null then
			# NOTE(review): an error is recorded when the native `rmdir` returns true,
			# whereas `file_delete` and `file_mkdir` are treated as returning true on
			# success elsewhere in this module. Confirm the return convention of
			# `NativeString::rmdir`; this test may be inverted.
			if path.to_cstring.rmdir then
				last_error = new IOError("Cannot remove `{self}`: {sys.errno.strerror}")
			end
		end
	end

	# Two paths are equal if their simplified forms are the same string.
	redef fun ==(other) do return other isa Path and simplified.path == other.simplified.path
	redef fun hash do return simplified.path.hash
end
722
# Information on a file
#
# Created by `Path::stat` and `Path::link_stat`.
#
# The information within this class is gathered when the instance is initialized;
# it will not be updated if the targeted file is modified.
class FileStat
	super Finalizable

	# TODO private init

	# The low-level status of a file
	#
	# See: POSIX stat(2)
	private var stat: NativeFileStat

	# Has the low-level status already been freed by `finalize`?
	private var finalized = false

	redef fun finalize
	do
		if finalized then return
		stat.free
		finalized = true
	end

	# The low-level status, after checking that it was not freed yet
	private fun live_stat: NativeFileStat
	do
		assert not finalized
		return stat
	end

	# Returns the last access time in seconds since Epoch
	fun last_access_time: Int do return live_stat.atime

	# Returns the last access time
	#
	# alias for `last_access_time`
	fun atime: Int do return last_access_time

	# Returns the last modification time in seconds since Epoch
	fun last_modification_time: Int do return live_stat.mtime

	# Returns the last modification time
	#
	# alias for `last_modification_time`
	fun mtime: Int do return last_modification_time


	# Size of the file at `path`
	fun size: Int do return live_stat.size

	# Is self a regular file and not a device file, pipe, socket, etc.?
	fun is_file: Bool do return live_stat.is_reg

	# Alias for `is_file`
	fun is_reg: Bool do return is_file

	# Is this a directory?
	fun is_dir: Bool do return live_stat.is_dir

	# Is this a symbolic link?
	fun is_link: Bool do return live_stat.is_lnk

	# FIXME Make the following POSIX only? or implement in some other way on Windows

	# Returns the last status change time in seconds since Epoch
	fun last_status_change_time: Int do return live_stat.ctime

	# Returns the last status change time
	#
	# alias for `last_status_change_time`
	fun ctime: Int do return last_status_change_time

	# Returns the permission bits of file
	fun mode: Int do return live_stat.mode

	# Is this a character device?
	fun is_chr: Bool do return live_stat.is_chr

	# Is this a block device?
	fun is_blk: Bool do return live_stat.is_blk

	# Is this a FIFO pipe?
	fun is_fifo: Bool do return live_stat.is_fifo

	# Is this a UNIX socket
	fun is_sock: Bool do return live_stat.is_sock
end
854
redef class Text
	# A `Path` object giving access to the file system services on the path at `self`
	fun to_path: Path
	do
		var res = new Path(to_s)
		return res
	end

	# Write each substring of `self` on `s`, one native write per substring.
	private fun write_native_to(s: FileWriter)
	do
		for chunk in substrings do
			s.write_native(chunk.to_cstring, 0, chunk.bytelen)
		end
	end
end
864
865 redef class String
# Does a file with this name exist?
fun file_exists: Bool
do
	var native_path = to_cstring
	return native_path.file_exists
end
868
# The status of the file at `self`, see POSIX stat(2).
#
# Return `null` in case of error.
fun file_stat: nullable FileStat
do
	var native_stat = to_cstring.file_stat
	if not native_stat.address_is_null then return new FileStat(native_stat)
	return null
end
876
# The status of the file or of the symlink at `self`, see POSIX lstat(2).
#
# Return `null` in case of error.
fun file_lstat: nullable FileStat
do
	var native_stat = to_cstring.file_lstat
	if not native_stat.address_is_null then return new FileStat(native_stat)
	return null
end
884
# Remove the file at `self`; return true on success.
fun file_delete: Bool
do
	var native_path = to_cstring
	return native_path.file_delete
end
887
# Copy the content of the file at `self` to the file at `dest`
#
# The work is delegated to `Path::copy`.
fun file_copy_to(dest: String)
do
	var source = to_path
	var target = dest.to_path
	source.copy(target)
end
890
# Remove the trailing `extension`.
#
# `extension` usually starts with a dot but could be anything.
#
#     assert "file.txt".strip_extension(".txt") == "file"
#     assert "file.txt".strip_extension("le.txt") == "fi"
#     assert "file.txt".strip_extension("xt") == "file.t"
#
# If `extension == null`, the rightmost extension is stripped, including the last dot.
#
#     assert "file.txt".strip_extension == "file"
#
# If `extension` is not present, `self` is returned unmodified.
#
#     assert "file.txt".strip_extension(".tar.gz") == "file.txt"
fun strip_extension(extension: nullable String): String
do
	var suffix = extension
	if suffix == null then
		# No explicit extension: use the one of the file name, if any.
		var ext = file_extension
		if ext == null then return self
		suffix = ".{ext}"
	end

	if not has_suffix(suffix) then return self
	return substring(0, length - suffix.length)
end
920
# Extract the basename of a path and strip the `extension`
#
# The extension is stripped only if `extension != null`.
#
#     assert "/path/to/a_file.ext".basename(".ext") == "a_file"
#     assert "path/to/a_file.ext".basename(".ext") == "a_file"
#     assert "path/to/a_file.ext".basename == "a_file.ext"
#     assert "path/to".basename(".ext") == "to"
#     assert "path/to/".basename(".ext") == "to"
#     assert "path/to".basename == "to"
#     assert "path".basename("") == "path"
#     assert "/path".basename("") == "path"
#     assert "/".basename("") == "/"
#     assert "".basename("") == ""
#
# Names that end at the first character are handled too:
#
#     assert "a".basename == "a"
#     assert "a/".basename == "a"
fun basename(extension: nullable String): String
do
	var l = length - 1 # Index of the last char
	while l > 0 and self.chars[l] == '/' do l -= 1 # remove all trailing `/`
	# The path is the root only if the remaining first char is itself a `/`.
	# (`l == 0` alone is also true for "a" or "a/".)
	if l == 0 and self.chars[0] == '/' then return "/"
	var pos = chars.last_index_of_from('/', l)
	var n = self
	# Cut when there is a directory part (`pos >= 0`)
	# or when some trailing `/` were skipped (`l < length - 1`).
	# With `pos == -1` the name simply starts at index 0.
	if pos >= 0 or l < length - 1 then
		n = substring(pos+1, l-pos)
	end

	if extension != null then
		return n.strip_extension(extension)
	else return n
end
950
# Extract the dirname of a path
#
#     assert "/path/to/a_file.ext".dirname == "/path/to"
#     assert "path/to/a_file.ext".dirname == "path/to"
#     assert "path/to".dirname == "path"
#     assert "path/to/".dirname == "path"
#     assert "path".dirname == "."
#     assert "/path".dirname == "/"
#     assert "/".dirname == "/"
#     assert "".dirname == "."
#
# Repeated separators are not kept at the end of the result:
#
#     assert "path//to".dirname == "path"
#     assert "//path".dirname == "/"
fun dirname: String
do
	var l = length - 1 # Index of the last char
	while l > 0 and self.chars[l] == '/' do l -= 1 # remove all trailing `/`
	var pos = chars.last_index_of_from('/', l)
	# Go back to the first `/` of a run of separators,
	# so that the result does not end with a spurious `/`.
	while pos > 0 and self.chars[pos-1] == '/' do pos -= 1
	if pos > 0 then
		return substring(0, pos)
	else if pos == 0 then
		# The only directory part is the root.
		return "/"
	else
		# No directory part at all.
		return "."
	end
end
974
# Return the canonicalized absolute pathname (see POSIX function `realpath`)
#
# Require: `file_exists`
fun realpath: String
do
	var resolved = to_cstring.file_realpath
	assert file_exists
	# Copy the native result into a managed string before freeing it.
	var copy = resolved.to_s_with_copy
	resolved.free
	return copy
end
985
# Simplify a file path by removing useless `.`, removing `//`, and resolving `..`
#
# * `..` are not resolved if they start the path
# * `..` just under the root directory stays at the root directory
# * starting `.` is simplified unless the path is empty
# * starting `/` is not removed
# * trailing `/` is removed
#
# Note that the method only works on the string:
#
# * no I/O access is performed
# * the validity of the path is not checked
#
# ~~~
# assert "some/./complex/../../path/from/../to/a////file//".simplify_path == "path/to/a/file"
# assert "../dir/file".simplify_path == "../dir/file"
# assert "dir/../../".simplify_path == ".."
# assert "dir/..".simplify_path == "."
# assert "//absolute//path/".simplify_path == "/absolute/path"
# assert "//absolute//../".simplify_path == "/"
# assert "/".simplify_path == "/"
# assert "/..".simplify_path == "/"
# assert "/../dir".simplify_path == "/dir"
# assert "../".simplify_path == ".."
# assert "./".simplify_path == "."
# assert "././././././".simplify_path == "."
# assert "./../dir".simplify_path == "../dir"
# assert "./dir".simplify_path == "dir"
# ~~~
fun simplify_path: String
do
	var a = self.split_with("/")
	var a2 = new Array[String]
	for x in a do
		if x == "." and not a2.is_empty then continue # skip `././`
		if x == "" and not a2.is_empty then continue # skip `//`
		# An empty component is only kept as the very first one, where it stands
		# for the root. Popping it on `..` would turn an absolute path into a
		# relative one.
		if x == ".." and not a2.is_empty and a2.last == "" then continue # `/..` is `/`
		if x == ".." and not a2.is_empty and a2.last != ".." then
			if a2.last == "." then # do not skip `./../`
				a2.pop # reduce `./../` in `../`
			else # reduce `dir/../` in `/`
				a2.pop
				continue
			end
		else if not a2.is_empty and a2.last == "." then
			a2.pop # reduce `./dir` in `dir`
		end
		a2.push(x)
	end
	if a2.is_empty then return "."
	# Only the root marker remains.
	if a2.length == 1 and a2.first == "" then return "/"
	return a2.join("/")
end
1035
# Correctly join two paths using the directory separator.
#
# Using a standard "{self}/{path}" does not work in the following cases:
#
# * `self` is empty.
# * `path` starts with `'/'`.
#
# This method ensures that the join is valid.
#
#     assert "hello".join_path("world")   == "hello/world"
#     assert "hel/lo".join_path("wor/ld") == "hel/lo/wor/ld"
#     assert "".join_path("world")        == "world"
#     assert "hello".join_path("/world")  == "/world"
#     assert "hello/".join_path("world")  == "hello/world"
#     assert "hello/".join_path("/world") == "/world"
#
# Note: You may want to use `simplify_path` on the result.
#
# Note: This method works only with POSIX paths.
fun join_path(path: String): String
do
	if path.is_empty then return self
	# Nothing to prepend, or `path` is absolute: `path` alone is the answer.
	if is_empty or path.chars[0] == '/' then return path
	# Do not double the separator when `self` already ends with one.
	var sep = "/"
	if last == '/' then sep = ""
	return "{self}{sep}{path}"
end
1063
# Convert the path (`self`) to a program name.
#
# Ensure the path (`self`) will be treated as-is by POSIX shells when it is
# used as a program name. In order to do that, prepend `./` if needed.
#
#     assert "foo".to_program_name == "./foo"
#     assert "/foo".to_program_name == "/foo"
#     assert "".to_program_name == "./" # At least, your shell will detect the error.
fun to_program_name: String
do
	# A path starting with `/` is returned as is.
	if has_prefix("/") then return self
	return "./{self}"
end
1079
# Alias for `join_path`
#
#     assert "hello" / "world"      == "hello/world"
#     assert "hel/lo" / "wor/ld"    == "hel/lo/wor/ld"
#     assert "" / "world"           == "world"
#     assert "/hello" / "/world"    == "/world"
#
# This operator is quite useful for chaining changes of path.
# The next one being relative to the previous one.
#
#     var a = "foo"
#     var b = "/bar"
#     var c = "baz/foobar"
#     assert a/b/c == "/bar/baz/foobar"
fun /(path: String): String
do
	var joined = join_path(path)
	return joined
end
1095
# Returns the relative path needed to go from `self` to `dest`.
#
#     assert "/foo/bar".relpath("/foo/baz") == "../baz"
#     assert "/foo/bar".relpath("/baz/bar") == "../../baz/bar"
#
# If `self` or `dest` is relative, they are considered relatively to `getcwd`.
#
# In some cases, the result is still independent of the current directory:
#
#     assert "foo/bar".relpath("..") == "../../.."
#
# In other cases, parts of the current directory may be exhibited:
#
#     var p = "../foo/bar".relpath("baz")
#     var c = getcwd.basename
#     assert p == "../../{c}/baz"
#
# For path resolution independent of the current directory (eg. for paths in URL),
# or to use an other starting directory than the current directory,
# just force absolute paths:
#
#     var start = "/a/b/c/d"
#     var p2 = (start/"../foo/bar").relpath(start/"baz")
#     assert p2 == "../../d/baz"
#
#
# Neither `self` or `dest` has to be real paths or to exist in directories since
# the resolution is only done with string manipulations and without any access to
# the underlying file system.
#
# If `self` and `dest` are the same directory, the empty string is returned:
#
#     assert "foo".relpath("foo") == ""
#     assert "foo/../bar".relpath("bar") == ""
#
# The empty string and "." designate both the current directory:
#
#     assert "".relpath("foo/bar")  == "foo/bar"
#     assert ".".relpath("foo/bar") == "foo/bar"
#     assert "foo/bar".relpath("")  == "../.."
#     assert "/" + "/".relpath(".") == getcwd
fun relpath(dest: String): String
do
	var cwd = getcwd
	var from = (cwd/self).simplify_path.split("/")
	if from.last.is_empty then from.pop # case for the root directory
	var to = (cwd/dest).simplify_path.split("/")
	if to.last.is_empty then to.pop # case for the root directory

	# Drop the leading components shared by both paths
	while not from.is_empty and not to.is_empty and from.first == to.first do
		from.shift
		to.shift
	end

	# One `..` for each remaining component of `from`,
	# then the remaining components of `to`.
	var steps = new Array[String]
	var ups = from.length
	while ups > 0 do
		steps.add ".."
		ups -= 1
	end
	steps.add_all to
	return steps.join("/")
end
1159
# Create a directory (and all intermediate directories if needed)
#
# The optional `mode` parameter specifies the permissions of the directory,
# the default value is `0o777`.
#
# Each prefix of the path is created in turn.
# A failure on an intermediate directory (typically because it already exists)
# is not reported by itself: only the outcome of the creation of the
# last component decides of the result.
#
# Return an error object in case of error.
#
#     assert "/etc/".mkdir != null
fun mkdir(mode: nullable Int): nullable Error
do
	mode = mode or else 0o777

	var dirs = self.split_with("/")
	var path = new FlatBuffer
	if dirs.is_empty then return null
	if dirs[0].is_empty then
		# it was a starting /
		path.add('/')
	end

	# Status of the most recently attempted component.
	# It is overwritten at each step so that an already existing parent
	# directory does not mask the successful creation of its children.
	var error: nullable Error = null
	for d in dirs do
		if d.is_empty then continue
		path.append(d)
		path.add('/')
		var res = path.to_s.to_cstring.file_mkdir(mode)
		if res then
			error = null
		else
			# `errno` is read right after the failing call
			error = new IOError("Cannot create directory `{path}`: {sys.errno.strerror}")
		end
	end
	return error
end
1191
# Delete a directory and all of its content
#
# Does not go through symbolic links and may get stuck in a cycle if there
# is a cycle in the filesystem.
#
# The work is delegated to `Path::rmdir`;
# the error recorded by that path object, if any, is returned.
#
#     assert "/fail/does not/exist".rmdir != null
fun rmdir: nullable Error
do
	var target = to_path
	target.rmdir
	return target.last_error
end
1206
# Make `self` the current working directory
#
#     "/etc".chdir
#     assert getcwd == "/etc"
#     "..".chdir
#     assert getcwd == "/"
#
# Return an error object in case of error.
#
#     assert "/etc".chdir == null
#     assert "/fail/does no/exist".chdir != null
#     assert getcwd == "/etc" # unchanged
fun chdir: nullable Error
do
	if to_cstring.file_chdir then return null
	# The message is built right after the failing call so `errno` is still relevant
	return new IOError("Cannot change directory to `{self}`: {sys.errno.strerror}")
end
1226
# Extension found after the last dot (the dot itself is excluded)
#
# Only the right-most extension is considered,
# combined extensions get no special treatment.
#
#     assert "file.txt".file_extension      == "txt"
#     assert "file.tar.gz".file_extension   == "gz"
#
# `null` is returned when there is no extension.
# However, a trailing dot yields `""`.
#
#     assert "file".file_extension          == null
#     assert "file.".file_extension         == ""
#
# The leading dot of a hidden file never starts an extension.
#
#     assert ".file.txt".file_extension     == "txt"
#     assert ".file".file_extension         == null
fun file_extension: nullable String
do
	var dot = chars.last_index_of('.')
	# Only a dot located after the first character starts an extension
	if dot <= 0 then return null
	return substring(dot + 1, length)
end
1254
# List the names of the entries of the directory designated by `self`.
#
# The special entries `.` and `..` are never part of the result.
#
#     var files = "/etc".files
#     assert files.has("issue")
#
# An empty array is returned when the directory cannot be opened
#
#     files = "/etc/issue".files
#     assert files.is_empty
#
# TODO find a better way to handle errors and to give them back to the user.
fun files: Array[String]
do
	var entries = new Array[String]
	var dir = new NativeDir.opendir(to_cstring)
	if dir.address_is_null then return entries

	# A null entry ends the enumeration
	var entry = dir.readdir
	while not entry.address_is_null do
		var name = entry.to_s_with_copy
		if name != "." and name != ".." then entries.add name
		entry = dir.readdir
	end
	dir.closedir

	return entries
end
1283 end
1284
redef class FlatString
	# Write the bytes of `self` (`bytelen` bytes from `first_byte`) to `s`
	redef fun write_native_to(s)
	do
		s.write_native(items, first_byte, bytelen)
	end

	# Byte-level implementation of `file_extension`
	#
	# `null` is returned when there is no dot, or when the only dot is the
	# first byte of the string (hidden file).
	redef fun file_extension do
		var its = _items
		var st = _first_byte
		var ls = last_byte
		var dot = '.'.ascii
		var p = ls
		# Look backward for the last dot.
		# The bound is tested before each access so no byte outside of
		# `[st, ls]` is ever read, even on an empty string.
		while p > st and its[p] != dot do p -= 1
		# Reaching `st` means no dot, or a dot only at the first byte
		if p <= st then return null
		return new FlatString.with_infos(its, ls - p, p + 1)
	end

	# Byte-level implementation of `basename`
	#
	# Trailing `/` are ignored; a path made only of `/` yields `"/"`.
	# When `extension` is not null, it is stripped from the result.
	redef fun basename(extension) do
		var l = last_byte
		var its = _items
		var min = _first_byte
		var sl = '/'.ascii
		# Skip the trailing slashes
		while l > min and its[l] == sl do l -= 1
		# Only slashes: the path is the root.
		# The byte is checked so that a one-byte name (eg. "a" or "a/")
		# is not mistaken for the root.
		if l == min and its[l] == sl then return "/"
		# Look backward for the slash that precedes the last component
		var ns = l
		while ns >= min and its[ns] != sl do ns -= 1
		var bname = new FlatString.with_infos(its, l - ns, ns + 1)

		return if extension != null then bname.strip_extension(extension) else bname
	end
end
1319
redef class NativeString
	# Can the file at path `self` be opened for reading?
	private fun file_exists: Bool `{
		FILE *hdl = fopen(self,"r");
		if(hdl != NULL){
			fclose(hdl);
		}
		return hdl != NULL;
	`}

	# `stat(2)` on the path `self`
	#
	# Return a heap-allocated copy of the result, or a null pointer on error.
	private fun file_stat: NativeFileStat `{
		struct stat buff;
		struct stat* stat_element;
		if(stat(self, &buff) == -1) return NULL;
		stat_element = malloc(sizeof(struct stat));
		/* an allocation failure is reported as an error, not passed to memcpy */
		if(stat_element == NULL) return NULL;
		return memcpy(stat_element, &buff, sizeof(struct stat));
	`}

	# `lstat(2)` on the path `self`
	#
	# Return a heap-allocated copy of the result, or a null pointer on error.
	private fun file_lstat: NativeFileStat `{
		struct stat buff;
		struct stat* stat_element;
		/* stat into a local buffer first: nothing is allocated, thus
		 * nothing is leaked, when the call fails */
		if(lstat(self, &buff) == -1) return NULL;
		stat_element = malloc(sizeof(struct stat));
		if(stat_element == NULL) return NULL;
		return memcpy(stat_element, &buff, sizeof(struct stat));
	`}

	# `mkdir(2)` on the path `self`, true on success
	private fun file_mkdir(mode: Int): Bool `{ return !mkdir(self, mode); `}

	# `rmdir(2)` on the path `self`, true on success
	private fun rmdir: Bool `{ return !rmdir(self); `}

	# `remove(3)` on the path `self`, true on success
	private fun file_delete: Bool `{
		return remove(self) == 0;
	`}

	# `chdir(2)` to the path `self`, true on success
	private fun file_chdir: Bool `{ return !chdir(self); `}

	# `realpath(3)` of `self`, with a result buffer allocated by the C library
	private fun file_realpath: NativeString `{ return realpath(self, NULL); `}
end
1360
# Native `struct stat *`
#
# This class is system dependent ... must reify the vfs
private extern class NativeFileStat `{ struct stat * `}

	# Value of the `st_mode` field
	fun mode: Int `{
		return self->st_mode;
	`}

	# Time of the last access (`st_atime`)
	fun atime: Int `{
		return self->st_atime;
	`}

	# Time of the last status change (`st_ctime`)
	fun ctime: Int `{
		return self->st_ctime;
	`}

	# Time of the last modification (`st_mtime`)
	fun mtime: Int `{
		return self->st_mtime;
	`}

	# Size (`st_size`)
	fun size: Int `{
		return self->st_size;
	`}

	# Is it a regular file (not a device file, pipe, socket, ...)?
	fun is_reg: Bool `{
		return S_ISREG(self->st_mode);
	`}

	# Is it a directory?
	fun is_dir: Bool `{
		return S_ISDIR(self->st_mode);
	`}

	# Is it a character device?
	fun is_chr: Bool `{
		return S_ISCHR(self->st_mode);
	`}

	# Is it a block device?
	fun is_blk: Bool `{
		return S_ISBLK(self->st_mode);
	`}

	# Is it a fifo?
	fun is_fifo: Bool `{
		return S_ISFIFO(self->st_mode);
	`}

	# Is it a symbolic link?
	fun is_lnk: Bool `{
		return S_ISLNK(self->st_mode);
	`}

	# Is it a socket?
	fun is_sock: Bool `{
		return S_ISSOCK(self->st_mode);
	`}
end
1400
# Native `FILE *` of the C standard library
private extern class NativeFile `{ FILE* `}
	# `fread` at most `len` bytes into `buf`, return the number of bytes read
	fun io_read(buf: NativeString, len: Int): Int `{
		return fread(buf, 1, len, self);
	`}

	# `fwrite` `len` bytes of `buf` starting at offset `from`, return the number of bytes written
	fun io_write(buf: NativeString, from, len: Int): Int `{
		return fwrite(buf+from, 1, len, self);
	`}

	# `fwrite` the single byte `value`, return the number of bytes written
	fun write_byte(value: Byte): Int `{
		unsigned char b = (unsigned char)value;
		return fwrite(&b, 1, 1, self);
	`}

	# `fclose` the stream
	fun io_close: Int `{
		return fclose(self);
	`}

	# `fstat(2)` on the descriptor of the stream
	#
	# Return a heap-allocated copy of the result, or a null pointer on error.
	fun file_stat: NativeFileStat `{
		struct stat buff;
		struct stat* stat_element;
		if(fstat(fileno(self), &buff) == -1) return 0;
		stat_element = malloc(sizeof(struct stat));
		return memcpy(stat_element, &buff, sizeof(struct stat));
	`}

	# Error indicator of the stream
	fun ferror: Bool `{
		return ferror(self);
	`}

	# File descriptor of the stream
	fun fileno: Int `{
		return fileno(self);
	`}

	# Flushes the buffer, forcing the write operation
	fun flush: Int `{
		return fflush(self);
	`}

	# `setvbuf` with the buffering `mode` and a buffer of `buf_length` bytes
	fun set_buffering_type(buf_length, mode: Int): Int `{
		return setvbuf(self, NULL, (int)mode, buf_length);
	`}

	# `fopen` the file at `path` with the mode "r"
	new io_open_read(path: NativeString) `{
		return fopen(path, "r");
	`}

	# `fopen` the file at `path` with the mode "w"
	new io_open_write(path: NativeString) `{
		return fopen(path, "w");
	`}

	# The C `stdin`
	new native_stdin `{
		return stdin;
	`}

	# The C `stdout`
	new native_stdout `{
		return stdout;
	`}

	# The C `stderr`
	new native_stderr `{
		return stderr;
	`}
end
1450
# Native `DIR*` directory stream
private extern class NativeDir `{ DIR* `}

	# `opendir` the directory at `path`
	new opendir(path: NativeString) `{
		return opendir(path);
	`}

	# `closedir` the directory stream
	fun closedir `{
		closedir(self);
	`}

	# Name of the next entry, or a null pointer when `readdir` returns nothing
	fun readdir: NativeString `{
		struct dirent *entry = readdir(self);
		return entry ? entry->d_name : NULL;
	`}
end
1468
redef class Sys

	# Standard input
	var stdin: PollableReader = new Stdin is protected writable, lazy

	# Standard output
	var stdout: Writer = new Stdout is protected writable, lazy

	# Standard output for errors
	var stderr: Writer = new Stderr is protected writable, lazy

	# Enumeration for buffer mode full (flushes when buffer is full)
	fun buffer_mode_full: Int `{ return _IOFBF; `}

	# Enumeration for buffer mode line (flushes when a `\n` is encountered)
	fun buffer_mode_line: Int `{ return _IOLBF; `}

	# Enumeration for buffer mode none (flushes ASAP when something is written)
	fun buffer_mode_none: Int `{ return _IONBF; `}

	# returns first available stream to read or write to
	# return null on interruption (possibly a signal)
	#
	# `FileReader` streams are polled for input, `FileWriter` streams for output.
	protected fun poll( streams : Sequence[FileStream] ) : nullable FileStream
	do
		var in_fds = new Array[Int]
		var out_fds = new Array[Int]
		var fd_to_stream = new HashMap[Int,FileStream]
		for s in streams do
			var fd = s.fd
			if s isa FileReader then in_fds.add( fd )
			if s isa FileWriter then out_fds.add( fd )

			fd_to_stream[fd] = s
		end

		var polled_fd = intern_poll( in_fds, out_fds )

		if polled_fd == null then
			return null
		else
			return fd_to_stream[polled_fd]
		end
	end

	# Block in `poll(2)` until a descriptor of `in_fds` is readable,
	# a descriptor of `out_fds` is writable, or one of them is hung up.
	#
	# Return the first such descriptor, or null when none is found
	# (error or interruption of `poll`).
	private fun intern_poll(in_fds: Array[Int], out_fds: Array[Int]): nullable Int
	import Array[Int].length, Array[Int].[], Int.as(nullable Int) `{
		int in_len, out_len, total_len;
		struct pollfd *c_fds;
		int i;
		int first_polled_fd = -1;
		int result;

		in_len = (int)Array_of_Int_length( in_fds );
		out_len = (int)Array_of_Int_length( out_fds );
		total_len = in_len + out_len;
		c_fds = malloc( sizeof(struct pollfd) * total_len );
		if ( c_fds == NULL && total_len > 0 ) {
			fprintf( stderr, "Error in Stream:poll: %s\n", strerror( errno ) );
			return null_Int();
		}

		/* input streams, stored in [0, in_len[ */
		for ( i=0; i<in_len; i ++ ) {
			int fd = (int)Array_of_Int__index( in_fds, i );

			c_fds[i].fd = fd;
			c_fds[i].events = POLLIN;
		}

		/* output streams, stored after the input ones in [in_len, total_len[ */
		for ( i=0; i<out_len; i ++ ) {
			int fd = (int)Array_of_Int__index( out_fds, i );

			c_fds[in_len + i].fd = fd;
			c_fds[in_len + i].events = POLLOUT;
		}

		/* poll all fds, unlimited timeout */
		result = poll( c_fds, total_len, -1 );

		if ( result > 0 ) {
			/* analyse results */
			for ( i=0; i<total_len; i++ )
				if ( c_fds[i].revents & c_fds[i].events || /* awaited event */
					 c_fds[i].revents & POLLHUP ) /* closed */
				{
					first_polled_fd = c_fds[i].fd;
					break;
				}
		}
		else if ( result < 0 )
			fprintf( stderr, "Error in Stream:poll: %s\n", strerror( errno ) );

		/* errno has been reported, the array can be released */
		free( c_fds );

		/* no usable descriptor: do not leak -1 to the caller */
		if ( first_polled_fd < 0 ) return null_Int();
		return Int_as_nullable( first_polled_fd );
	`}

end
1564
# Write `objects`, converted with `plain_to_s`, on the standard output (`stdout`).
fun printn(objects: Object...)
do
	var text = objects.plain_to_s
	sys.stdout.write(text)
end
1570
# Write the `to_s` of `object` on the standard output (`stdout`), followed by a newline.
fun print(object: Object)
do
	var out = sys.stdout
	out.write(object.to_s)
	out.write("\n")
end
1577
# Write the `to_s` of `object` on the error output (`stderr` or a log system), followed by a newline.
fun print_error(object: Object)
do
	var err = sys.stderr
	err.write(object.to_s)
	err.write("\n")
end
1584
# Read a character from the standard input (`stdin`).
#
# `'\1'` is returned when `read_char` yields `null`.
fun getc: Char
do
	var c = sys.stdin.read_char
	if c != null then return c
	return '\1'
end
1592
# Read a line from the standard input (`stdin`), as given by `read_line`.
fun gets: String
do
	var line = sys.stdin.read_line
	return line
end
1598
# Return the working (current) directory
fun getcwd: String
do
	var native = native_getcwd
	return native.to_s
end
1601
private fun native_getcwd: NativeString `{
	return getcwd(NULL, 0);
`}