/*****************************************************************************\
*                                                                             *
*  Name   : find_non_ascii                                                    *
*  Author : Chris Koeritz                                                     *
*                                                                             *
*  Purpose:                                                                   *
*                                                                             *
*    Reads through a file looking for bytes with value greater than 127.      *
*                                                                             *
*******************************************************************************
* Copyright (c) 1991-$now By Author.  This program is free software; you can  *
* redistribute it and/or modify it under the terms of the GNU General Public  *
* License as published by the Free Software Foundation; either version 2 of   *
* the License or (at your option) any later version.  This is online at:      *
*     http://www.fsf.org/copyleft/gpl.html                                    *
* Please send any updates to: fred@gruntose.com                               *
\*****************************************************************************/

#include <basis/istring.h>
#include <opsystem/byte_filer.h>
#include <loggers/console_logger.h>
#include <data_struct/static_memory_gremlin.h>

HOOPLE_STARTUP_CODE;

const int BUFFER_SIZE = 32768;
  // this is the size of the chunk we read from the files at a time.  it is
  // important to make this a multiple of 16, since that's the size of the line
  // we use in the byte dumping.

#define fnc_console program_wide_logger()

int print_instructions_and_exit(char *program_name)
{
  fnc_console.log(istring(istring::SPRINTF, "\n\
Usage:\n\t%s filename [filename]\n\n\
Reads the files specified and reports characters whose value is greater\n\
than 127.  The reported line number and character positions start at one\n\
rather than the programmer's zero.\n\n",
      program_name).s());
  return 23;
}

int main(int argc, char *argv[])
{
  SET_DEFAULT_CONSOLE_LOGGER;

  if (argc <= 1) return print_instructions_and_exit(argv[0]);
  else {
    int current_parameter = 0;
    bool past_first_file = false;
    while (++current_parameter < argc) {
      if (past_first_file) {
        // we're into the second file so start using some white space.
        fnc_console.log("");
        fnc_console.log("");
      }
      past_first_file = true;  // set condition for next time.
      istring name = argv[current_parameter];
      byte_filer current(name, "rb");
      if (!current.good()) {
        fnc_console.log(istring("Cannot find the file named \"") + name
            + istring("\"."));
        continue;
      }
      byte buff[BUFFER_SIZE + 10];  // buffer plus some extra room.
      int line = 0;
      while (true) {
        line++;
        int bytes_read = current.getline(buff, BUFFER_SIZE);
        if (bytes_read <= 0) break;  // no contents.
//fnc_console.log(istring(istring::SPRINTF, "read %d bytes", bytes_read));

        for (int i = 0; i < bytes_read; i++) {
          if (buff[i] > 127) {
            fnc_console.log(isprintf("non-ascii char %d at line %d "
                "posn %d in file %s", int(buff[i]), line, i + 1, name.s()));
          }
        }

      }
    }
  }
  return 0;
}

#ifdef __BUILD_STATIC_APPLICATION__
  // static dependencies found by buildor_gen_deps.sh:
  #include <basis/array.cpp>
  #include <basis/byte_array.cpp>
  #include <basis/callstack_tracker.cpp>
  #include <basis/chaos.cpp>
  #include <basis/convert_utf.cpp>
  #include <basis/definitions.cpp>
  #include <basis/earth_time.cpp>
  #include <basis/guards.cpp>
  #include <basis/istring.cpp>
  #include <basis/log_base.cpp>
  #include <basis/memory_checker.cpp>
  #include <basis/mutex.cpp>
  #include <basis/object_base.cpp>
  #include <basis/outcome.cpp>
  #include <basis/packable.cpp>
  #include <basis/portable.cpp>
  #include <basis/sequence.cpp>
  #include <basis/set.cpp>
  #include <basis/utility.cpp>
  #include <basis/version_record.cpp>
  #include <data_struct/amorph.cpp>
  #include <data_struct/bit_vector.cpp>
  #include <data_struct/byte_hasher.cpp>
  #include <data_struct/configurator.cpp>
  #include <data_struct/hash_table.cpp>
  #include <data_struct/pointer_hash.cpp>
  #include <data_struct/stack.cpp>
  #include <data_struct/static_memory_gremlin.cpp>
  #include <data_struct/string_hash.cpp>
  #include <data_struct/string_hasher.cpp>
  #include <data_struct/string_table.cpp>
  #include <data_struct/symbol_table.cpp>
  #include <data_struct/table_configurator.cpp>
  #include <loggers/console_logger.cpp>
  #include <loggers/file_logger.cpp>
  #include <loggers/locked_logger.cpp>
  #include <loggers/null_logger.cpp>
  #include <loggers/program_wide_logger.cpp>
  #include <opsystem/byte_filer.cpp>
  #include <opsystem/command_line.cpp>
  #include <opsystem/critical_events.cpp>
  #include <opsystem/directory.cpp>
  #include <opsystem/filename.cpp>
  #include <opsystem/ini_config.cpp>
  #include <opsystem/ini_parser.cpp>
  #include <opsystem/path_configuration.cpp>
  #include <opsystem/rendezvous.cpp>
  #include <textual/byte_format.cpp>
  #include <textual/parser_bits.cpp>
  #include <textual/string_manipulation.cpp>
  #include <textual/tokenizer.cpp>
#endif // __BUILD_STATIC_APPLICATION__

