lib/file: document and fix `file_extension`
[nit.git] / lib / standard / file.nit
1 # This file is part of NIT ( http://www.nitlanguage.org ).
2 #
3 # Copyright 2004-2008 Jean Privat <jean@pryen.org>
4 # Copyright 2008 Floréal Morandat <morandat@lirmm.fr>
5 # Copyright 2008 Jean-Sébastien Gélinas <calestar@gmail.com>
6 #
7 # This file is free software, which comes along with NIT. This software is
8 # distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY;
9 # without even the implied warranty of MERCHANTABILITY or FITNESS FOR A
10 # PARTICULAR PURPOSE. You can modify it is you want, provided this header
11 # is kept unaltered, and a notification of the changes is added.
12 # You are allowed to redistribute it and sell it, alone or is a part of
13 # another product.
14
15 # File manipulations (create, read, write, etc.)
16 module file
17
18 intrude import stream
19 intrude import string
20 import string_search
21 import time
22
23 in "C Header" `{
24 #include <dirent.h>
25 #include <string.h>
26 #include <sys/types.h>
27 #include <sys/stat.h>
28 #include <unistd.h>
29 `}
30
redef class Object
	# Simple I/O

	# Write `objects.to_s` on the standard output (`stdout`).
	#
	# Nothing else (in particular no newline) is written.
	protected fun printn(objects: Object...)
	do
		var text = objects.to_s
		stdout.write(text)
	end

	# Write `object.to_s` on the standard output (`stdout`), then a newline.
	protected fun print(object: Object)
	do
		var out = stdout
		out.write(object.to_s)
		out.write("\n")
	end

	# Read a character from the standard input (`stdin`).
	#
	# The value given by `stdin.read_char` is converted with `ascii`.
	protected fun getc: Char
	do
		var code = stdin.read_char
		return code.ascii
	end

	# Read a line from the standard input (`stdin`).
	protected fun gets: String do return stdin.read_line

	# Return the working (current) directory
	protected fun getcwd: String
	do
		var native_path = file_getcwd
		return native_path.to_s
	end

	# Native service behind `getcwd` (implemented by an external C function).
	private fun file_getcwd: NativeString is extern "string_NativeString_NativeString_file_getcwd_0"
end
63
# File Abstract Stream
#
# Holds what the file-based streams share: a path and a native file.
abstract class FStream
	super IOS
	# The path of the file.
	readable var _path: nullable String = null

	# The FILE *.
	#
	# `null` as long as no native file has been attached.
	var _file: nullable NativeFile = null

	# Status information (`FileStat`) of the attached native file.
	fun file_stat: FileStat do return _file.file_stat
end
76
# File input stream
class IFStream
	super FStream
	super BufferedIStream
	# Misc

	# Open the same file again.
	#
	# The stream is closed first, unless its end was already reached.
	# The original path is reused, therefore the reopened file can be a different file.
	fun reopen
	do
		if not eof then close
		var native_path = _path.to_cstring
		_file = new NativeFile.io_open_read(native_path)
		# Forget everything that was buffered from the previous file
		_buffer.clear
		_buffer_pos = 0
		_end_reached = false
	end

	# Close the native file and mark the end of the stream as reached.
	redef fun close
	do
		_file.io_close
		_end_reached = true
	end

	# Refill the buffer with at most `_buffer._capacity` bytes read from the native file.
	#
	# When nothing could be read, the buffer is left empty
	# and the end of the stream is marked as reached.
	redef fun fill_buffer
	do
		var count = _file.io_read(_buffer._items, _buffer._capacity)
		if count > 0 then
			_buffer._length = count
		else
			_end_reached = true
			_buffer._length = 0
		end
		_buffer_pos = 0
	end

	# End of file?
	redef readable var _end_reached: Bool = false

	# Open the file at `path` for reading.
	#
	# Abort (`cant_open_file`) if the native file cannot be opened.
	init open(path: String)
	do
		_path = path
		prepare_buffer(10)
		_file = new NativeFile.io_open_read(path.to_cstring)
		assert cant_open_file: _file != null
	end

	private init do end
	private init without_file do end
end
126
# File output stream
class OFStream
	super FStream
	super OStream

	# Write the `s.length` first bytes of `s.to_cstring` to the file.
	#
	# The stream must be writable.
	redef fun write(s)
	do
		assert _writable
		var native = s.to_cstring
		write_native(native, s.length)
	end

	redef fun is_writable do return _writable

	# Close the native file; the stream is no longer writable afterwards.
	redef fun close
	do
		_file.io_close
		_writable = false
	end

	# Is the file open in write mode
	var _writable: Bool

	# Write `len` bytes from `native`.
	#
	# A message is printed on the standard output when
	# the native write does not report exactly `len`.
	private fun write_native(native: NativeString, len: Int)
	do
		assert _writable
		var written = _file.io_write(native, len)
		if written == len then return
		# Big problem
		printn("Problem in writing : ", written, " ", len, "\n")
	end

	# Open the file at `path` for writing.
	#
	# Abort (`cant_open_file`) if the native file cannot be opened.
	init open(path: String)
	do
		var native_path = path.to_cstring
		_file = new NativeFile.io_open_write(native_path)
		assert cant_open_file: _file != null
		_writable = true
		_path = path
	end

	private init do end
	private init without_file do end
end
172
173 ###############################################################################
174
# Input stream bound to the native standard input
class Stdin
	super IFStream
	private init do
		_path = "/dev/stdin"
		_file = new NativeFile.native_stdin
		prepare_buffer(1)
	end

	# Is there something to read? (non blocking)
	# FIXME: should be generalized
	fun poll_in: Bool is extern "file_stdin_poll_in"
end
187
# Output stream bound to the native standard output
class Stdout
	super OFStream
	private init do
		_path = "/dev/stdout"
		_writable = true
		_file = new NativeFile.native_stdout
	end
end
196
# Output stream bound to the native standard error output
class Stderr
	super OFStream
	private init do
		_path = "/dev/stderr"
		_writable = true
		_file = new NativeFile.native_stderr
	end
end
205
206 ###############################################################################
207
redef class Streamable
	# Like `write_to` but take care of creating the file
	#
	# An `OFStream` is opened on `filepath`, given to `write_to`, then closed.
	fun write_to_file(filepath: String)
	do
		var out = new OFStream.open(filepath)
		write_to(out)
		out.close
	end
end
217
redef class String
	# Return true if a file with this name exists
	fun file_exists: Bool do return to_cstring.file_exists

	# Status information of the file at this path
	fun file_stat: FileStat do return to_cstring.file_stat

	# Status information of the file at this path, as given by `lstat`
	fun file_lstat: FileStat do return to_cstring.file_lstat

	# Remove a file, return true if success
	fun file_delete: Bool do return to_cstring.file_delete

	# Copy content of file at `self` to `dest`
	fun file_copy_to(dest: String)
	do
		var input = new IFStream.open(self)
		var output = new OFStream.open(dest)

		# Transfer the content by chunks of at most 1024 characters
		while not input.eof do
			var buffer = input.read(1024)
			output.write buffer
		end

		input.close
		output.close
	end

	# Remove the trailing extension `ext`
	#
	# `self` is returned unchanged if it does not end with `ext`.
	fun strip_extension(ext: String): String
	do
		if has_suffix(ext) then
			return substring(0, length - ext.length)
		end
		return self
	end

	# Extract the basename of a path and remove the extension
	#
	#     assert "/path/to/a_file.ext".basename(".ext")     == "a_file"
	#     assert "path/to/a_file.ext".basename(".ext")      == "a_file"
	#     assert "path/to".basename(".ext")                 == "to"
	#     assert "path/to/".basename(".ext")                == "to"
	#     assert "path".basename("")                        == "path"
	#     assert "/path".basename("")                       == "path"
	#     assert "/".basename("")                           == "/"
	#     assert "".basename("")                            == ""
	#
	# Short names and trailing `/` without any inner `/` are handled too.
	#
	#     assert "a".basename("")                           == "a"
	#     assert "dir///".basename("")                      == "dir"
	fun basename(ext: String): String
	do
		var l = _length - 1 # Index of the last char
		while l > 0 and self.chars[l] == '/' do l -= 1 # remove all trailing `/`
		# The path is the root only if it is made of nothing but `/`
		if l == 0 and self.chars[0] == '/' then return "/"
		var pos = last_index_of_from('/', l)
		var n = self
		if pos >= 0 or l < _length - 1 then
			# Keep what lies after the last inner `/` (if any) and before the trailing `/` (if any)
			n = substring(pos+1, l-pos)
		end
		return n.strip_extension(ext)
	end

	# Extract the dirname of a path
	#
	#     assert "/path/to/a_file.ext".dirname         == "/path/to"
	#     assert "path/to/a_file.ext".dirname          == "path/to"
	#     assert "path/to".dirname                     == "path"
	#     assert "path/to/".dirname                    == "path"
	#     assert "path".dirname                        == "."
	#     assert "/path".dirname                       == "/"
	#     assert "/".dirname                           == "/"
	#     assert "".dirname                            == "."
	fun dirname: String
	do
		var l = _length - 1 # Index of the last char
		while l > 0 and self.chars[l] == '/' do l -= 1 # remove all trailing `/`
		var pos = last_index_of_from('/', l)
		if pos > 0 then
			return substring(0, pos)
		else if pos == 0 then
			return "/"
		else
			return "."
		end
	end

	# Return the canonicalized absolute pathname (see POSIX function `realpath`)
	fun realpath: String do
		var cs = to_cstring.file_realpath
		var res = cs.to_s_with_copy
		# cs.free_malloc # FIXME memory leak
		return res
	end

	# Simplify a file path by removing useless ".", removing "//", and resolving ".."
	# ".." are not resolved if they start the path
	# starting "/" is not removed
	# trailing "/" is removed
	#
	# Note that the method only works on the string:
	#  * no I/O access is performed
	#  * the validity of the path is not checked
	#
	#     assert "some/./complex/../../path/from/../to/a////file//".simplify_path  == "path/to/a/file"
	#     assert "../dir/file".simplify_path                                       == "../dir/file"
	#     assert "dir/../../".simplify_path                                        == ".."
	#     assert "dir/..".simplify_path                                            == "."
	#     assert "//absolute//path/".simplify_path                                 == "/absolute/path"
	#
	# The root directory is its own parent and is never simplified away.
	#
	#     assert "/".simplify_path                                                 == "/"
	#     assert "/..".simplify_path                                               == "/"
	#     assert "/../dir".simplify_path                                           == "/dir"
	fun simplify_path: String
	do
		var a = self.split_with("/")
		var a2 = new Array[String]
		for x in a do
			if x == "." then continue
			# Only a leading empty element is kept: it stands for the starting "/"
			if x == "" and not a2.is_empty then continue
			if x == ".." and not a2.is_empty and a2.last != ".." then
				# Do not pop the marker of the starting "/": ".." of the root is the root
				if not a2.last.is_empty then a2.pop
				continue
			end
			a2.push(x)
		end
		if a2.is_empty then return "."
		# Only the marker of the starting "/" remains: joining it would give ""
		if a2.length == 1 and a2.first.is_empty then return "/"
		return a2.join("/")
	end

	# Correctly join two path using the directory separator.
	#
	# Using a standard "{self}/{path}" does not work when `self` is the empty string.
	# This method ensures that the join is valid.
	#
	#     assert "hello".join_path("world")      ==  "hello/world"
	#     assert "hel/lo".join_path("wor/ld")      ==  "hel/lo/wor/ld"
	#     assert "".join_path("world")      ==  "world"
	#     assert "/hello".join_path("/world")      ==  "/world"
	#
	# Note: you may want to use `simplify_path` on the result
	#
	# Note: If you want to join a great number of paths, you can write
	#
	#     [p1, p2, p3, p4].join("/")
	fun join_path(path: String): String
	do
		if path.is_empty then return self
		if self.is_empty then return path
		# An absolute `path` replaces `self`
		if path.chars[0] == '/' then return path
		return "{self}/{path}"
	end

	# Create a directory (and all intermediate directories if needed)
	#
	# The results of the native directory creations are ignored.
	fun mkdir
	do
		var dirs = self.split_with("/")
		var path = new Buffer
		if dirs.is_empty then return
		if dirs[0].is_empty then
			# it was a starting /
			path.add('/')
		end
		# Create each prefix of the path, from the shortest to the longest
		for d in dirs do
			if d.is_empty then continue
			path.append(d)
			path.add('/')
			path.to_s.to_cstring.file_mkdir
		end
	end

	# Change the current working directory
	#
	#     "/etc".chdir
	#     assert getcwd == "/etc"
	#     "..".chdir
	#     assert getcwd == "/"
	#
	# TODO: errno
	fun chdir do to_cstring.file_chdir

	# Return right-most extension (without the dot)
	#
	# Only the last extension is returned.
	# There is no special case for combined extensions.
	#
	#     assert "file.txt".file_extension      == "txt"
	#     assert "file.tar.gz".file_extension   == "gz"
	#
	# For file without extension, `null` is returned.
	# However, for trailing dot, `""` is returned.
	#
	#     assert "file".file_extension          == null
	#     assert "file.".file_extension         == ""
	#
	# The starting dot of hidden files is never considered.
	#
	#     assert ".file.txt".file_extension     == "txt"
	#     assert ".file".file_extension         == null
	#
	# Only the last component of a path is considered.
	#
	#     assert "dir.d/file".file_extension     == null
	#     assert "dir.d/file.txt".file_extension == "txt"
	#     assert "dir/.file".file_extension      == null
	fun file_extension: nullable String
	do
		var last_dot = last_index_of('.')
		var last_slash = last_index_of('/')
		# Without any dot, `last_dot` is negative and the test below holds.
		# A dot before the last `/` belongs to a directory name.
		# A dot that starts the last component only marks a hidden file.
		if last_dot <= last_slash + 1 then return null
		return substring( last_dot+1, length )
	end

	# Return the names of the files contained within the directory represented by self
	#
	# The `.` and `..` entries are skipped.
	# If the directory cannot be opened, an error is printed with `perror`
	# and the program exits with the status 1.
	fun files : Set[ String ] is extern import HashSet[String], HashSet[String].add, NativeString.to_s, String.to_cstring, HashSet[String].as(Set[String]) `{
		char *dir_path;
		DIR *dir;

		dir_path = String_to_cstring( recv );
		if ((dir = opendir(dir_path)) == NULL)
		{
			perror( dir_path );
			exit( 1 );
		}
		else
		{
			HashSet_of_String results;
			String file_name;
			struct dirent *de;

			results = new_HashSet_of_String();

			while ( ( de = readdir( dir ) ) != NULL )
				if ( strcmp( de->d_name, ".." ) != 0 &&
					strcmp( de->d_name, "." ) != 0 )
				{
					file_name = NativeString_to_s( strdup( de->d_name ) );
					HashSet_of_String_add( results, file_name );
				}

			closedir( dir );
			return HashSet_of_String_as_Set_of_String( results );
		}
	`}
end
449
redef class NativeString
	# Native service behind `String::file_exists` (external C function)
	private fun file_exists: Bool is extern "string_NativeString_NativeString_file_exists_0"

	# Native service behind `String::file_stat` (external C function)
	private fun file_stat: FileStat is extern "string_NativeString_NativeString_file_stat_0"

	# Call `lstat` on the path and return the filled `struct stat`.
	#
	# The structure is allocated with `malloc`.
	# `NULL` is returned if the allocation or the call to `lstat` fails.
	private fun file_lstat: FileStat `{
		struct stat* stat_element;
		int res;
		stat_element = malloc(sizeof(struct stat));
		if (stat_element == NULL) return NULL;
		res = lstat(recv, stat_element);
		if (res == -1) {
			/* Nobody else knows this buffer: release it instead of leaking it */
			free(stat_element);
			return NULL;
		}
		return stat_element;
	`}

	# Native service behind `String::mkdir` (external C function)
	private fun file_mkdir: Bool is extern "string_NativeString_NativeString_file_mkdir_0"

	# Native service behind `String::file_delete` (external C function)
	private fun file_delete: Bool is extern "string_NativeString_NativeString_file_delete_0"

	# Native service behind `String::chdir` (external C function)
	private fun file_chdir is extern "string_NativeString_NativeString_file_chdir_0"

	# Native service behind `String::realpath` (external C function)
	private fun file_realpath: NativeString is extern "file_NativeString_realpath"
end
466
# Status information of a file, backed by a native `struct stat *`
extern FileStat `{ struct stat * `}
	# This class is system dependent ... must reify the vfs

	# Type predicates: each one applies the named POSIX macro to `st_mode`.

	# Result of `S_ISREG` on `st_mode`
	fun is_reg: Bool `{ return S_ISREG(recv->st_mode); `}
	# Result of `S_ISDIR` on `st_mode`
	fun is_dir: Bool `{ return S_ISDIR(recv->st_mode); `}
	# Result of `S_ISCHR` on `st_mode`
	fun is_chr: Bool `{ return S_ISCHR(recv->st_mode); `}
	# Result of `S_ISBLK` on `st_mode`
	fun is_blk: Bool `{ return S_ISBLK(recv->st_mode); `}
	# Result of `S_ISFIFO` on `st_mode`
	fun is_fifo: Bool `{ return S_ISFIFO(recv->st_mode); `}
	# Result of `S_ISLNK` on `st_mode`
	fun is_lnk: Bool `{ return S_ISLNK(recv->st_mode); `}
	# Result of `S_ISSOCK` on `st_mode`
	fun is_sock: Bool `{ return S_ISSOCK(recv->st_mode); `}

	# Accessors implemented by external C functions.
	# NOTE(review): presumably they read the `st_mode`, `st_atime`, `st_ctime`,
	# `st_mtime` and `st_size` fields; confirm against the C implementation.

	fun mode: Int is extern "file_FileStat_FileStat_mode_0"
	fun atime: Int is extern "file_FileStat_FileStat_atime_0"
	fun ctime: Int is extern "file_FileStat_FileStat_ctime_0"
	fun mtime: Int is extern "file_FileStat_FileStat_mtime_0"
	fun size: Int is extern "file_FileStat_FileStat_size_0"
end
483
# Instances of this class are standard FILE * pointers
#
# Every service is bound to an external C function.
private extern NativeFile `{ FILE* `}
	# Native file opened on `path` for reading
	new io_open_read(path: NativeString) is extern "file_NativeFileCapable_NativeFileCapable_io_open_read_1"
	# Native file opened on `path` for writing
	new io_open_write(path: NativeString) is extern "file_NativeFileCapable_NativeFileCapable_io_open_write_1"
	# Native file of the standard input
	new native_stdin is extern "file_NativeFileCapable_NativeFileCapable_native_stdin_0"
	# Native file of the standard output
	new native_stdout is extern "file_NativeFileCapable_NativeFileCapable_native_stdout_0"
	# Native file of the standard error output
	new native_stderr is extern "file_NativeFileCapable_NativeFileCapable_native_stderr_0"

	# Native read into `buf`, given `len`.
	# Callers in this module treat a result `<= 0` as the end of the stream.
	fun io_read(buf: NativeString, len: Int): Int is extern "file_NativeFile_NativeFile_io_read_2"
	# Native write from `buf`, given `len`.
	# Callers in this module expect `len` as the result of a successful write.
	fun io_write(buf: NativeString, len: Int): Int is extern "file_NativeFile_NativeFile_io_write_2"
	# Native close of the file
	fun io_close: Int is extern "file_NativeFile_NativeFile_io_close_0"
	# Status information of the file
	fun file_stat: FileStat is extern "file_NativeFile_NativeFile_file_stat_0"
end
497
# Standard input.
#
# The `Stdin` instance is created `once` and then shared.
fun stdin: Stdin
do
	return once new Stdin
end
500
# Standard output.
#
# The `Stdout` instance is created `once` and then shared.
fun stdout: OFStream
do
	return once new Stdout
end
503
# Standard output for error.
#
# The `Stderr` instance is created `once` and then shared.
fun stderr: OFStream
do
	return once new Stderr
end