1 /*****************************************************************************\
4 * Author : Chris Koeritz *
6 *******************************************************************************
7 * Copyright (c) 1993-$now By Author. This program is free software; you can *
8 * redistribute it and/or modify it under the terms of the GNU General Public *
9 * License as published by the Free Software Foundation; either version 2 of *
10 * the License or (at your option) any later version. This is online at: *
11 * http://www.fsf.org/copyleft/gpl.html *
12 * Please send any updates to: fred@gruntose.com *
13 \*****************************************************************************/
15 // implementation note: the filename is kept canonicalized. any constructor
16 // or assignment operator should ensure this (except the blank constructor).
20 #include <basis/byte_array.h>
21 #include <basis/functions.h>
22 #include <textual/parser_bits.h>
26 #include <sys/types.h>
// debugging aid: prints "class::function: message" followed by a newline
// using printf.  it relies on static_class_name() and on a local named
// `func` being in scope wherever the macro is expanded (presumably supplied
// by FUNCDEF -- confirm).
35 #define LOG(to_print) printf("%s::%s: %s\n", static_class_name(), func, astring(to_print).s())
37 using namespace basis;
38 using namespace structures;
// a named class layered over the c library's stat record; get_info() in this
// file fills one of these in.
// NOTE(review): the class body is not visible in this excerpt.
40 class status_info : public stat
44 namespace filesystem {
// DEFAULT_SEPARATOR is the separator character that names are rewritten to
// use on this platform: a backslash for win32/vms builds and a forward slash
// for unix builds.  the #error below reports a platform that matches neither
// (presumably behind an #else that is not visible here).
46 #if defined(__WIN32__) || defined(__VMS__)
47 const char DEFAULT_SEPARATOR = '\\';
48 #elif defined(__UNIX__)
49 const char DEFAULT_SEPARATOR = '/';
51 #error "We have no idea what the default path separator is."
// NO_PARENT_DEFAULT is the directory name reported when a path has no parent
// component left to return.
54 const char *NO_PARENT_DEFAULT = ".";
55 // used when no directory name can be popped off.
// builds a filename from a single string.
// NOTE(review): the body is not visible here; per the implementation note at
// the top of this file, constructors are expected to leave the name
// canonicalized.
62 filename::filename(const astring &name)
// builds a filename out of a directory and the name of a file inside it.
// per the comments below, an empty directory is replaced by
// NO_PARENT_DEFAULT and _had_directory is cleared.  a DEFAULT_SEPARATOR is
// appended unless the directory's last character is already a backslash or a
// forward slash, and then name_of_file is appended.
// NOTE(review): several lines of this body are not visible in this excerpt.
67 filename::filename(const astring &directory, const astring &name_of_file)
71 // if the directory is empty, use the current directory.
73 *this = astring(NO_PARENT_DEFAULT);
74 _had_directory = false;
76 // check for a slash on the end of the directory. add one if there is none
78 bool add_slash = false;
79 if ( (directory[directory.end()] != '\\')
80 && (directory[directory.end()] != '/') ) add_slash = true;
81 if (add_slash) *this += DEFAULT_SEPARATOR;
82 *this += name_of_file;
// copy constructor: the _had_directory flag is taken from the source object.
// NOTE(review): the remainder of the initializer list and the body are not
// visible in this excerpt.
86 filename::filename(const filename &to_copy)
88 _had_directory(to_copy._had_directory)
91 filename::~filename() {}
93 astring filename::default_separator() { return astring(DEFAULT_SEPARATOR, 1); }
95 astring &filename::raw() { return *this; }
97 const astring &filename::raw() const { return *this; }
99 bool filename::good() const { return exists(); }
101 bool filename::unlink() const { return ::unlink(observe()) == 0; }
// NOTE(review): only the signature is visible in this excerpt; judging by the
// name alone this presumably reports the platform's null device -- confirm
// against the body.
103 astring filename::null_device()
112 bool filename::separator(char is_it)
113 { return (is_it == pc_separator) || (is_it == unix_separator); }
// assignment from another filename: both the text (through the astring
// base) and the _had_directory flag are copied.  self-assignment is caught
// first and returns without changing anything.
115 filename &filename::operator = (const filename &to_copy)
117 if (this == &to_copy) return *this;
118 (astring &)(*this) = to_copy;
119 _had_directory = to_copy._had_directory;
// assignment from a plain string: the text is copied through the astring
// base and the name is marked as having a directory.
// NOTE(review): _had_directory is set to true before the self-assignment
// check, so the flag changes even when the early return is taken -- confirm
// that this ordering is intended.
// NOTE(review): the lines after the copy are not visible in this excerpt.
123 filename &filename::operator = (const astring &to_copy)
125 _had_directory = true;
126 if (this == &to_copy) return *this;
127 (astring &)(*this) = to_copy;
// strips the last component from the path.  the basename and the parent are
// computed up front; when the parent is just NO_PARENT_DEFAULT there was
// nothing to strip, and an empty string is returned to signal that.
// NOTE(review): the path taken when a component was removed is not visible
// in this excerpt.
132 astring filename::pop()
134 astring to_return = basename();
135 filename parent_dir = parent();
136 if (parent_dir.raw().equal_to(NO_PARENT_DEFAULT)) {
137 // we haven't gone anywhere.
138 return ""; // signal that nothing was removed.
144 filename filename::parent() const { return dirname(); }
// appends a component to this path.  the name is rebuilt through the
// two-argument constructor, with the current value passed first and to_push
// second, and the result is assigned back to this object.
146 void filename::push(const astring &to_push)
148 *this = filename(*this, to_push);
// rewrites the stored name into its canonical form.  the visible steps are:
//  - every separator character becomes DEFAULT_SEPARATOR, and _had_directory
//    is cleared when the name held no separator at all.
//  - doubled separators are collapsed, except for a leading pair, which may
//    introduce a UNC name.
//  - per the comments below, on windows the cygwin ("<sep>cygdrive<sep>x...")
//    and msys ("<sep>x<sep>...") spellings are turned into the "x:" drive form.
//  - a trailing separator is trimmed, and a bare "X:" gets a separator
//    appended so that it names a directory.
// NOTE(review): a number of lines of this function (braces, preprocessor
// guards, part of the double-separator loop) are not visible in this excerpt.
151 void filename::canonicalize()
153 FUNCDEF("canonicalize");
154 // turn all the non-default separators into the default.
155 bool found_sep = false;
156 for (int j = 0; j < length(); j++) {
157 if (separator(get(j))) {
159 put(j, DEFAULT_SEPARATOR);
163 // if there wasn't a single directory separator, then they must not have
164 // specified any directory name for this filename (although it could itself
166 if (!found_sep) _had_directory = false;
168 // remove all occurrences of double separators except for the first
169 // double set, which could be a UNC filename. that's why the index below
170 // starts at one rather than zero.
171 bool saw_sep = false;
172 for (int i = 1; i < length(); i++) {
173 if (separator(get(i))) {
176 // two in a row is no good, except for the first two.
177 i--; // skip back one and try again.
181 } else saw_sep = false;
185 // on windows, we want to translate away from any cygwin or msys format into a more palatable
186 // version that the rest of windows understands.
188 const astring CYGDRIVE_PATH = astring(astring(DEFAULT_SEPARATOR, 1) + "cygdrive"
189 + astring(DEFAULT_SEPARATOR, 1));
190 // must be at least as long as the string we're looking for, plus a drive letter afterwards.
191 if ( (length() > CYGDRIVE_PATH.length() + 1) && begins(CYGDRIVE_PATH) ) {
// zap() takes an inclusive index range (compare zap(0, 0) and
// zap(last, last) further down), so the last index to remove is
// length() - 1.  that deletes exactly the prefix, both of its slashes
// included, and leaves the drive letter at index 0, which is where the
// colon insertion on the next line expects it.
192 zap(0, CYGDRIVE_PATH.length() - 1); // whack the cygdrive portion plus two slashes.
193 insert(1, ":"); // add a colon after the imputed drive letter.
195 // now we convert msys...
196 if ( (length() >= 2) && (get(0) == DEFAULT_SEPARATOR) && textual::parser_bits::is_alpha(get(1)) ) {
197 // we seem reasonably sure now that this is a windows path hiding in msys format, but
198 // the next character needs to be a slash (if there is a next character) for it to be
199 // the windows drive form. otherwise it could be /tmp, which would obviously not be
200 // intended as a windows path.
201 if ( (length() < 3) || (get(2) == DEFAULT_SEPARATOR) ) {
202 // cool, this should be interpretable as an msys path, except for those wacky types
203 // that use top-level single character directory names. we cannot help that, because
204 // we *know* msys is a choice used in other code a lot.
205 //hmmm: future revision: see if the file or directory '/x' actually exists on current drive? yuck.
206 zap(0, 0); // take off initial slash.
207 insert(1, ":"); // add the obligatory colon.
212 LOG(astring("ha ha turned string into: ") + *this);
214 // we don't crop the last separator if the name's too small. for msdos
215 // names, that would be chopping a slash off the c:\ style name.
217 // zap any separators that are hiding on the end.
218 const int last = end();
219 if (separator(get(last))) zap(last, last);
220 } else if ( (length() == 2) && (get(1) == ':') ) {
221 // special case for dos drive names. we turn it back into a valid
222 // directory rather than leaving it as just "X:". that form of the name
223 // means something else under dos/windows.
224 *this += astring(DEFAULT_SEPARATOR, 1);
// reports a drive letter for this name.  per the comments, the first guess
// is the leading letter when the second character is a colon.  the file
// system is only consulted when interact_with_fs is set; in that case the
// letter is computed as 'A' plus the st_dev field that get_info() retrieved.
// NOTE(review): the values returned on the early exits are not visible in
// this excerpt.
228 char filename::drive(bool interact_with_fs) const
230 // first guess: if second letter's a colon, first letter's the drive.
235 if (!interact_with_fs)
238 // otherwise, retrieve the file system's record for the file.
240 if (!get_info(&fill))
242 return char('A' + fill.st_dev);
// returns the portion of the base name that follows a period located by
// find().  the search is started at the end of the base name (the third
// argument to find() presumably requests a backwards search -- confirm).
// NOTE(review): the handling of a name with no period is not visible here.
245 astring filename::extension() const
247 astring base(basename().raw());
248 int posn = base.find('.', base.end(), true);
251 return base.substring(posn + 1, base.length() - 1);
// returns the portion of the base name that precedes a period located by
// find().  the search is started at the end of the base name (the third
// argument to find() presumably requests a backwards search -- confirm).
// NOTE(review): the handling of a name with no period is not visible here.
254 astring filename::rootname() const
256 astring base(basename().raw());
257 int posn = base.find('.', base.end(), true);
260 return base.substring(0, posn - 1);
// fills in to_fill by calling stat() on this name.
// NOTE(review): how `ret` is turned into the boolean result is not visible
// in this excerpt.
263 bool filename::get_info(status_info *to_fill) const
265 int ret = stat(observe(), to_fill);
// reports whether this name refers to a directory, judging by the mode bits
// that get_info() retrieves.
// NOTE(review): the declaration of `fill` and the result returned when
// get_info() fails are not visible in this excerpt.
271 bool filename::is_directory() const
274 if (!get_info(&fill))
// the file type is a multi-bit field inside st_mode, so it is masked out
// with S_IFMT and compared as a whole.  testing the S_IFDIR bit by itself
// would also accept other file types that happen to share that bit (block
// devices, for one).
276 return (fill.st_mode & S_IFMT) == S_IFDIR;
// reports whether the S_IWRITE bit is set in the mode that get_info()
// retrieves for this name.
// NOTE(review): the result returned when get_info() fails is not visible in
// this excerpt.
279 bool filename::is_writable() const
282 if (!get_info(&fill))
284 return !!(fill.st_mode & S_IWRITE);
// reports whether the S_IREAD bit is set in the mode that get_info()
// retrieves for this name.
// NOTE(review): the result returned when get_info() fails is not visible in
// this excerpt.
287 bool filename::is_readable() const
290 if (!get_info(&fill))
292 return !!(fill.st_mode & S_IREAD);
// reports whether the S_IEXEC bit is set in the mode that get_info()
// retrieves for this name.
// NOTE(review): the result returned when get_info() fails is not visible in
// this excerpt.
295 bool filename::is_executable() const
298 if (!get_info(&fill))
300 return !!(fill.st_mode & S_IEXEC);
// locates a DEFAULT_SEPARATOR in look_at.  each search starts just past the
// most recent hit, and last_sep is advanced whenever another separator is
// found.
// NOTE(review): the loop framing, the initial values and the return
// statement are not visible in this excerpt.
303 int filename::find_last_separator(const astring &look_at) const
308 sep = look_at.find(DEFAULT_SEPARATOR, last_sep + 1);
309 if (sep >= 0) last_sep = sep;
// produces the last component of the name.  a copy of the text is made and,
// when a separator is found, everything from the start of the copy through
// that separator is removed.
// NOTE(review): the return statement is not visible in this excerpt.
314 filename filename::basename() const
316 astring basename = *this;
317 int last_sep = find_last_separator(basename);
318 if (last_sep >= 0) basename.zap(0, last_sep);
// produces the directory portion of the name.  working on a copy of the
// text, three outcomes are visible below:
//  - the copy is cut from the last separator through its end.
//  - a name that starts with DEFAULT_SEPARATOR yields just that separator.
//  - otherwise NO_PARENT_DEFAULT is used.
// NOTE(review): the conditions selecting between these outcomes and the
// return statement are only partly visible in this excerpt.
322 filename filename::dirname() const
324 astring dirname = *this;
325 int last_sep = find_last_separator(dirname);
326 // we don't accept ripping off the first slash.
328 // we can rip the slash and suffix off to get the directory name. however,
329 // this might be in the form X: on windows. if they want the slash to
330 // remain, they can use the dirname that appends it.
331 dirname.zap(last_sep, dirname.end());
333 if (get(0) == DEFAULT_SEPARATOR) {
334 // handle when we're up at the top of the filesystem. on unix, once
335 // you hit the root, you can keep going up but you still remain at
336 // the root. similarly on windoze, if there's no drive name in there.
337 dirname = astring(DEFAULT_SEPARATOR, 1);
339 // there's no slash at all in the filename any more. we assume that
340 // the directory is the current one, if no other information is
341 // available. this default is already used by some code.
342 dirname = NO_PARENT_DEFAULT;
// string flavored variant of dirname(): takes the text of dirname() and,
// when add_slash is set, appends a DEFAULT_SEPARATOR to it.
// NOTE(review): the return statement is not visible in this excerpt.
348 astring filename::dirname(bool add_slash) const
350 astring tempname = dirname().raw();
351 if (add_slash) tempname += DEFAULT_SEPARATOR;
// reports whether the named item exists.  the visible return path answers
// with is_readable(); the commented-out lines show an alternative that
// opened the file with a byte_filer instead.
// NOTE(review): the lines ahead of the return are not visible in this
// excerpt.
355 bool filename::exists() const
361 return is_readable();
362 /// byte_filer opened(observe(), "rb");
363 /// return opened.good();
// classifies a character as acceptable or not within a filename.  any
// character without a case label of its own is legal (the default returns
// true).
// NOTE(review): only some of the case labels are visible in this excerpt,
// and the result returned for them is not shown.
366 bool filename::legal_character(char to_check)
371 case '*': case '?': case '$': case '&': case '|':
372 case '\'': case '"': case '`':
378 default: return true;
// scrubs a string in place: every character that legal_character() rejects
// is overwritten with `replacement`.  the length of to_clean is unchanged.
382 void filename::detooth_filename(astring &to_clean, char replacement)
384 for (int i = 0; i < to_clean.length(); i++) {
385 if (!legal_character(to_clean[i]))
386 to_clean[i] = replacement;
// size of the packed form: PACKED_SIZE_INT32 plus the packed size of the
// astring base.  pack() writes _had_directory as an int ahead of the string.
390 int filename::packed_size() const
392 return PACKED_SIZE_INT32 + astring::packed_size();
// serializes this object into packed_form: first the _had_directory flag,
// converted to an int, and then the astring base.
395 void filename::pack(byte_array &packed_form) const
397 attach(packed_form, int(_had_directory));
398 astring::pack(packed_form);
// restores this object from packed_form in the order pack() wrote it: a
// value detached into `temp` becomes _had_directory, and then the astring
// base is unpacked.
// NOTE(review): the declaration of `temp` and the results returned on
// failure and success are not visible in this excerpt.
401 bool filename::unpack(byte_array &packed_form)
404 if (!detach(packed_form, temp))
406 _had_directory = temp;
407 if (!astring::unpack(packed_form))
// splits the name into its components and appends them to `pieces`.
// characters are gathered in an accumulator until a separator is met.  the
// accumulated text is then added to the list if it is non-empty, or
// unconditionally when the separator is the very first character (so a
// leading separator contributes an empty first piece).  whatever remains in
// the accumulator after the last character is added as the final piece.
// NOTE(review): the lines between the signature and the first statement are
// not visible in this excerpt.
412 void filename::separate(string_array &pieces) const
415 const astring &raw_form = raw();
416 astring accumulator; // holds the names we find.
417 for (int i = 0; i < raw_form.length(); i++) {
418 if (separator(raw_form[i])) {
419 // this is a separator character, so eat it and add the accumulated
420 // string to the list.
421 if (!i || accumulator.length()) pieces += accumulator;
422 // now reset our accumulated text.
423 accumulator = astring::empty_string();
425 // not a separator, so just accumulate it.
426 accumulator += raw_form[i];
429 if (accumulator.length()) pieces += accumulator;
// rebuilds this name from a list of components.  the pieces are concatenated
// with a DEFAULT_SEPARATOR after each one except the last; the first piece
// always gets a separator after it, even when it is the only one.  the
// result is assigned to this object.
432 void filename::join(const string_array &pieces)
434 astring constructed_name; // we'll make a filename here.
435 for (int i = 0; i < pieces.length(); i++) {
436 constructed_name += pieces[i];
437 if (!i || (i != pieces.length() - 1))
438 constructed_name += DEFAULT_SEPARATOR;
440 *this = constructed_name;
// shared worker for the compare_prefix() methods.  to_compare is split into
// `second`, and the pieces in `first` are then checked one by one against the
// pieces of `second` at the same index.  the comparison ignores case on
// win32/vms builds and respects it otherwise.  the length check guards the
// case where `first` has more pieces than `second`.
// NOTE(review): the line that fills `first` (presumably from this object)
// and the return statements are not visible in this excerpt.
443 bool filename::base_compare_prefix(const filename &to_compare,
444 string_array &first, string_array &second)
447 to_compare.separate(second);
448 // that case should never be allowed, since there are some bits missing
449 // in the name to be compared.
450 if (first.length() > second.length())
453 // compare each of the pieces.
454 for (int i = 0; i < first.length(); i++) {
455 #if defined(__WIN32__) || defined(__VMS__)
456 // case-insensitive compare.
457 if (!first[i].iequals(second[i]))
460 // case-sensitive compare.
461 if (first[i] != second[i])
// prefix comparison that also reports what follows the prefix.  `sequel` is
// emptied first and base_compare_prefix() does the matching.  the loop then
// walks the pieces of `second` that lie beyond the first.length() matched
// ones, adding a DEFAULT_SEPARATOR after each piece except the last.
// NOTE(review): the declarations of `first` and `second`, the line that adds
// each piece to `sequel`, and the return statements are not visible in this
// excerpt.
468 bool filename::compare_prefix(const filename &to_compare, astring &sequel)
470 sequel = astring::empty_string(); // clean our output parameter.
473 if (!base_compare_prefix(to_compare, first, second))
476 // create the sequel string.
477 int extra_strings = second.length() - first.length();
478 for (int i = second.length() - extra_strings; i < second.length(); i++) {
480 if (i != second.length() - 1) sequel += DEFAULT_SEPARATOR;
// prefix comparison for callers that only want the yes/no answer; the result
// of base_compare_prefix() is returned directly.
// NOTE(review): the declarations of `first` and `second` are not visible in
// this excerpt.
486 bool filename::compare_prefix(const filename &to_compare)
490 return base_compare_prefix(to_compare, first, second);
// shared worker for the compare_suffix() methods.  to_compare is split into
// `second`, and the pieces in `first` are then checked from the last one
// backwards against the pieces of `second` that sit the same distance from
// its end.  the comparison ignores case on win32/vms builds and respects it
// otherwise.  the length check guards the case where `first` has more pieces
// than `second`.
// NOTE(review): the line that fills `first` (presumably from this object)
// and the return statements are not visible in this excerpt.
493 bool filename::base_compare_suffix(const filename &to_compare,
494 string_array &first, string_array &second)
497 to_compare.separate(second);
498 // that case should never be allowed, since there are some bits missing
499 // in the name to be compared.
500 if (first.length() > second.length())
503 // compare each of the pieces.
504 for (int i = first.length() - 1; i >= 0; i--) {
505 //clean up this computation; the difference in lengths is constant--use that.
506 int distance_from_end = first.length() - 1 - i;
507 int j = second.length() - 1 - distance_from_end;
508 #if defined(__WIN32__) || defined(__VMS__)
509 // case-insensitive compare.
510 if (!first[i].iequals(second[j]))
513 // case-sensitive compare.
514 if (first[i] != second[j])
// suffix comparison that also reports what precedes the suffix.  `prequel`
// is emptied first and base_compare_suffix() does the matching.  the leading
// pieces of `second` that are not covered by `first` are then appended to
// `prequel`.
// NOTE(review): the separator guard compares i against second.length() - 1
// while the loop stops at extra_strings, so a DEFAULT_SEPARATOR follows
// every copied piece unless `first` is empty -- confirm that the trailing
// separator is intended.
// NOTE(review): the declarations of `first` and `second` and the return
// statements are not visible in this excerpt.
521 bool filename::compare_suffix(const filename &to_compare, astring &prequel)
523 prequel = astring::empty_string(); // clean our output parameter.
526 if (!base_compare_suffix(to_compare, first, second))
529 // create the prequel string.
530 int extra_strings = second.length() - first.length();
531 for (int i = 0; i < extra_strings; i++) {
532 prequel += second[i];
533 if (i != second.length() - 1) prequel += DEFAULT_SEPARATOR;
// suffix comparison for callers that only want the yes/no answer; the result
// of base_compare_suffix() is returned directly.
// NOTE(review): the declarations of `first` and `second` are not visible in
// this excerpt.
538 bool filename::compare_suffix(const filename &to_compare)
542 return base_compare_suffix(to_compare, first, second);
545 bool filename::chmod(int write_mode, int owner_mode) const
549 if (write_mode & ALLOW_READ) {
550 if (owner_mode & USER_RIGHTS) chmod_value |= S_IRUSR;
551 if (owner_mode & GROUP_RIGHTS) chmod_value |= S_IRGRP;
552 if (owner_mode & OTHER_RIGHTS) chmod_value |= S_IROTH;
554 if (write_mode & ALLOW_WRITE) {
555 if (owner_mode & USER_RIGHTS) chmod_value |= S_IWUSR;
556 if (owner_mode & GROUP_RIGHTS) chmod_value |= S_IWGRP;
557 if (owner_mode & OTHER_RIGHTS) chmod_value |= S_IWOTH;
559 //// chmod_value = S_IRUSR | S_IWUSR | S_IRGRP | S_IROTH;
560 #elif defined(__WIN32__)
561 if (write_mode & ALLOW_READ) {
562 chmod_value |= _S_IREAD;
564 if (write_mode & ALLOW_WRITE) {
565 chmod_value |= _S_IWRITE;
568 #error unsupported OS type currently.
570 int chmod_result = ::chmod(raw().s(), chmod_value);
572 // LOG(astring("there was a problem changing permissions on ") + raw());