/******************************************************** * ██████╗ ██████╗████████╗██╗ * ██╔════╝ ██╔════╝╚══██╔══╝██║ * ██║ ███╗██║ ██║ ██║ * ██║ ██║██║ ██║ ██║ * ╚██████╔╝╚██████╗ ██║ ███████╗ * ╚═════╝ ╚═════╝ ╚═╝ ╚══════╝ * Geophysical Computational Tools & Library (GCTL) * * Copyright (c) 2023 Yi Zhang (yizhang-geo@zju.edu.cn) * * GCTL is distributed under a dual licensing scheme. You can redistribute * it and/or modify it under the terms of the GNU Lesser General Public * License as published by the Free Software Foundation, either version 2 * of the License, or (at your option) any later version. You should have * received a copy of the GNU Lesser General Public License along with this * program. If not, see . * * If the terms and conditions of the LGPL v.2. would prevent you from using * the GCTL, please consider the option to obtain a commercial license for a * fee. These licenses are offered by the GCTL's original author. As a rule, * licenses are provided "as-is", unlimited in time for a one time fee. Please * send corresponding requests to: yizhang-geo@zju.edu.cn. Please do not forget * to include some tcription of your company and the realm of its activities. * Also add information on how to contact you by electronic and paper mail. ******************************************************/ #include "dsv_io.h" gctl::dsv_io::dsv_io() { file_ = ""; att_sym_ = '#'; tag_sym_ = '!'; deli_sym_ = ' '; head_num_ = 0; row_num_ = 0; col_num_ = 0; } gctl::dsv_io::~dsv_io() { clear(); } gctl::dsv_io::dsv_io(std::string filename, std::string file_exten, table_headtype_e t) { file_ = ""; att_sym_ = '#'; tag_sym_ = '!'; deli_sym_ = ' '; head_num_ = 0; row_num_ = 0; col_num_ = 0; if (file_exten == ".csv") load_csv(filename, t); else load_text(filename, file_exten, t); } void gctl::dsv_io::clear() { file_ = ""; att_sym_ = '#'; tag_sym_ = '!'; deli_sym_ = ' '; head_num_ = 0; row_num_ = 0; col_num_ = 0; destroy_vector(heads_); destroy_vector(annotates_); destroy_vector(tags_); destroy_vector(table_); return; } void gctl::dsv_io::get_row_names(std::vector &names) { names.resize(row_num_); for (size_t i = 1; i < row_num_; i++) { names[i] = table_[i][0].str_; } return; } void gctl::dsv_io::get_column_names(std::vector &names) { names.resize(col_num_); for (size_t i = 1; i < col_num_; i++) { names[i] = table_[0][i].str_; } return; } void gctl::dsv_io::set_row_names(const std::vector &names) { for (size_t i = 1; i <= std::min(row_num_, (int) names.size()); i++) { table_[i][0].str_ = names[i]; } table_[0][0].str_ = "row_name"; return; } void gctl::dsv_io::set_column_names(const std::vector &names) { for (size_t i = 1; i <= std::min(col_num_, (int) names.size()); i++) { table_[0][i].str_ = names[i]; } return; } void gctl::dsv_io::load_text(std::string filename, std::string file_exten, table_headtype_e t) { std::ifstream infile; open_infile(infile, filename, file_exten); file_ = filename + file_exten; int h = 0; std::string tmp_line; std::vector lines; while (std::getline(infile, tmp_line)) { if (tmp_line.empty()) continue; // 跳过空行 空行不会并记入头信息计数中 else if (tmp_line[0] == att_sym_) // 注释行或者标记行 # #! { if (tmp_line[1] == tag_sym_) // #! { tmp_line = tmp_line.substr(2); // 去掉前两个字符 tmp_line.erase(0, tmp_line.find_first_not_of(" \t")); tmp_line.erase(tmp_line.find_last_not_of(" \t") + 1); tags_.push_back(tmp_line); continue; } // # tmp_line = tmp_line.substr(1); // 去掉第一个字符 tmp_line.erase(0, tmp_line.find_first_not_of(" \t")); tmp_line.erase(tmp_line.find_last_not_of(" \t") + 1); annotates_.push_back(tmp_line); } else if (h < head_num_) //读入到头信息中 { heads_.push_back(tmp_line); h++; } else lines.push_back(tmp_line); } infile.close(); table_.resize(lines.size()); int cn, cn_max = 0; std::vector tmp_cols; for (size_t i = 0; i < lines.size(); i++) { tmp_cols.clear(); parse_string_to_vector(lines[i], deli_sym_, tmp_cols); // 动态调整列数 cn = tmp_cols.size(); cn_max = std::max(cn, cn_max); table_[i].resize(tmp_cols.size()); for (size_t j = 0; j < tmp_cols.size(); j++) { table_[i][j].str_ = tmp_cols[j]; } } // 补齐可能的空格 table_cell empty_cell; for (size_t i = 0; i < table_.size(); i++) { cn = table_[i].size(); for (size_t j = cn; j < cn_max; j++) { table_[i].push_back(empty_cell); } } std::vector empty_line; if (t == NoHead) // 无表头 需要补齐空白的列头和行头 { row_num_ = table_.size(); col_num_ = table_[0].size(); table_.emplace(table_.begin(), empty_line); table_[0].resize(col_num_); for (size_t i = 0; i < table_.size(); i++) { table_[i].emplace(table_[i].begin(), empty_cell); } } if (t == ColumnHead) // 有列头 需要补齐空白的行头 { row_num_ = table_.size() - 1; col_num_ = table_[0].size(); for (size_t i = 0; i < table_.size(); i++) { table_[i].emplace(table_[i].begin(), empty_cell); } } if (t == RowHead) // 有行头 需要补齐空白的列头 { row_num_ = table_.size(); col_num_ = table_[0].size() - 1; table_.emplace(table_.begin(), empty_line); table_[0].resize(col_num_ + 1); } if (t == BothHead) // 有行头和列头 { row_num_ = table_.size() - 1; col_num_ = table_[0].size() - 1; } destroy_vector(lines); return; } void gctl::dsv_io::load_csv(std::string filename, table_headtype_e t) { set_delimeter(','); load_text(filename, ".csv", t); return; } void gctl::dsv_io::save_text(std::string filename, std::string file_exten) { std::ofstream outfile; open_outfile(outfile, filename, file_exten); for (int i = 0; i < heads_.size(); i++) { outfile << heads_[i] << std::endl; } for (int i = 0; i < tags_.size(); i++) { outfile << "#! " << tags_[i] << std::endl; } for (int i = 0; i < annotates_.size(); i++) { outfile << "# " << annotates_[i] << std::endl; } // 单独处理第一行 即列头 bool line_st = false; if (table_[0][0].out_ok_ && table_[0][0].str_ != "") { outfile << table_[0][0].str_; line_st = true; } for (int j = 1; j <= col_num_; j++) { if (line_st && table_[0][j].out_ok_ && table_[0][j].str_ != "") outfile << deli_sym_ << table_[0][j].str_; // line started else if (table_[0][j].out_ok_ && table_[0][j].str_ != "") // line not started { outfile << table_[0][j].str_; line_st = true; // start line } } if (line_st) outfile << std::endl; // 处理余下的行 for (int i = 1; i <= row_num_; i++) { line_st = false; // 单独处理第一列 即行头 if (table_[i][0].out_ok_ && table_[i][0].str_ != "") { outfile << table_[i][0].str_; line_st = true; } for (int j = 1; j <= col_num_; j++) { if (line_st && table_[i][j].out_ok_) outfile << deli_sym_ << table_[i][j].str_; // line started else if (table_[i][j].out_ok_) // line not started { outfile << table_[i][j].str_; line_st = true; // start line } } outfile << std::endl; } outfile.close(); return; } void gctl::dsv_io::save_csv(std::string filename) { set_delimeter(','); save_text(filename, ".csv"); return; } void gctl::dsv_io::init_table(int row, int col, table_headtype_e t) { row_num_ = row; col_num_ = col; // 初始的列头和行头均为空白 table_.resize(row_num_ + 1); for (size_t i = 0; i < row_num_ + 1; i++) { table_[i].resize(col_num_ + 1); } return; } void gctl::dsv_io::info(table_headtype_e t) { std::clog << "File: " << file_ << "\n------------\n"; std::clog << "Head(s): " << head_num_ << "\n"; std::clog << "Annotation(s): " << annotates_.size() << "\n"; std::clog << "Tag(s): " << tags_.size() << "\n"; std::clog << "------------\n"; if (t == ColumnHead || t == BothHead) { std::clog << "Columns:\n"; for (size_t i = 1; i <= col_num_; i++) { if (table_[0][i].str_ != "") { std::clog << table_[0][i].str_ << ": " << table_[1][i].str_ << " -> " << table_[row_num_][i].str_; } else { std::clog << "C" + std::to_string(i) << ": " << table_[1][i].str_ << " -> " << table_[row_num_][i].str_; } if (!table_[0][i].out_ok_) std::clog << " (No output)"; std::clog << std::endl; } std::clog << "============\n"; } if (t == RowHead || t == BothHead) { std::clog << "Rows:\n"; for (size_t i = 1; i <= row_num_; i++) { if (table_[i][0].str_ != "") { std::clog << table_[i][0].str_ << ": " << table_[i][1].str_ << " -> " << table_[i][col_num_].str_; } else { std::clog << "R" + std::to_string(i) << ": " << table_[i][1].str_ << " -> " << table_[i][col_num_].str_; } if (!table_[i][0].out_ok_) std::clog << " (No output)"; std::clog << std::endl; } std::clog << "============\n"; } return; } int gctl::dsv_io::name_index(std::string name, bool iter_row) { // 拾取行号或列号 格式为R和C std::smatch ret; std::regex patr("R(\\d*)"), patc("C(\\d*)"); if (regex_search(name, ret, patr)) { int r = atoi(std::string(ret[1]).c_str()); if (r >= 1 && r <= row_num_) return r; else return -1; } if (regex_search(name, ret, patc)) { int c = atoi(std::string(ret[1]).c_str()); if (c >= 1 && c <= col_num_) return c; else return -1; } if (iter_row) { for (size_t i = 1; i <= row_num_; i++) { if (table_[i][0].str_ == name) return i; } return -1; } else { for (size_t i = 1; i <= col_num_; i++) { if (table_[0][i].str_ == name) return i; } return -1; } } void gctl::dsv_io::column_output(int idx, switch_type_e s) { if (idx > col_num_ || idx <= 0) { throw std::runtime_error("[gctl::dsv_io] Invalid column index."); } for (size_t i = 0; i <= row_num_; i++) { if (s == Enable) table_[i][idx].out_ok_ = true; else table_[i][idx].out_ok_ = false; } return; } void gctl::dsv_io::column_output(std::string name, switch_type_e s) { column_output(name_index(name), s); return; } void gctl::dsv_io::row_output(int idx, switch_type_e s) { if (idx > row_num_ || idx <= 0) { throw std::runtime_error("[gctl::dsv_io] Invalid row index."); } for (size_t i = 0; i <= col_num_; i++) { if (s == Enable) table_[idx][i].out_ok_ = true; else table_[idx][i].out_ok_ = false; } return; } void gctl::dsv_io::row_output(std::string name, switch_type_e s) { row_output(name_index(name), s); return; } void gctl::dsv_io::add_column(std::string name) { table_cell empty_cell; for (size_t i = 0; i < table_.size(); i++) { table_[i].push_back(empty_cell); } table_[0].back().str_ = name; col_num_++; return; } void gctl::dsv_io::add_column(int idx, std::string name) { table_cell empty_cell; if (idx <= 0) { for (size_t i = 0; i < table_.size(); i++) { table_[i].push_back(empty_cell); } table_[0].back().str_ = name; col_num_++; } else { for (size_t i = 0; i < table_.size(); i++) { table_[i].insert(table_[i].begin() + idx, empty_cell); } table_[0][idx].str_ = name; col_num_++; } return; } void gctl::dsv_io::add_column(std::string id_name, std::string name) { add_column(name_index(id_name), name); return; } gctl::geodsv_io::geodsv_io(){} gctl::geodsv_io::~geodsv_io(){} gctl::geodsv_io::geodsv_io(std::string filename, std::string file_exten, table_headtype_e t) { file_ = ""; att_sym_ = '#'; tag_sym_ = '!'; deli_sym_ = ' '; head_num_ = 0; row_num_ = 0; col_num_ = 0; if (file_exten == ".csv") load_csv(filename, t); else load_text(filename, file_exten, t); } void gctl::geodsv_io::fill_column_point2dc(const array &data, int xid, int yid, int p) { if (xid > col_num_ || yid > col_num_ || xid == yid || xid <= 0 || yid <= 0) { throw std::runtime_error("[gctl::geodsv_io] Invalid column index."); } std::stringstream ss; std::string s; for (size_t i = 1; i <= std::min(row_num_, (int) data.size()); i++) { ss.clear(); ss << data[i - 1].x; ss >> s; table_[i][xid].str_ = s; ss.clear(); ss << data[i - 1].y; ss >> s; table_[i][yid].str_ = s; } return; } void gctl::geodsv_io::fill_column_point2dc(const array &data, std::string xname, std::string yname, int p) { fill_column_point2dc(data, name_index(xname, false), name_index(yname, false), p); return; } void gctl::geodsv_io::fill_column_point3dc(const array &data, int xid, int yid, int zid, int p) { if (xid > col_num_ || yid > col_num_ || zid > col_num_ || xid == yid || yid == zid || xid == zid || xid <= 0 || yid <= 0 || zid <= 0) { throw std::runtime_error("[gctl::geodsv_io] Invalid column index."); } std::stringstream ss; std::string s; for (size_t i = 1; i < std::min(row_num_, (int) data.size()); i++) { ss.clear(); ss << data[i - 1].x; ss >> s; table_[i][xid].str_ = s; ss.clear(); ss << data[i - 1].y; ss >> s; table_[i][yid].str_ = s; ss.clear(); ss << data[i - 1].z; ss >> s; table_[i][zid].str_ = s; } return; } void gctl::geodsv_io::fill_column_point3dc(const array &data, std::string xname, std::string yname, std::string zname, int p) { fill_column_point3dc(data, name_index(xname, false), name_index(yname, false), name_index(zname, false), p); return; } void gctl::geodsv_io::get_column_point2dc(array &data, int xid, int yid) { if (xid > col_num_ || yid > col_num_ || xid == yid || xid <= 0 || yid <= 0) { throw std::runtime_error("[gctl::geodsv_io] Invalid column index."); } data.resize(row_num_); for (size_t i = 1; i <= row_num_; i++) { data[i - 1].x = table_[i][xid].value(); data[i - 1].y = table_[i][yid].value(); } return; } void gctl::geodsv_io::get_column_point2dc(array &data, std::string xname, std::string yname) { get_column_point2dc(data, name_index(xname, false), name_index(yname, false)); return; } void gctl::geodsv_io::get_column_point3dc(array &data, int xid, int yid, int zid) { if (xid > col_num_ || yid > col_num_ || zid > col_num_ || xid == yid || yid == zid || xid == zid || xid <= 0 || yid <= 0 || zid <= 0) { throw std::runtime_error("[gctl::geodsv_io] Invalid column index."); } data.resize(row_num_); for (size_t i = 1; i <= row_num_; i++) { data[i - 1].x = table_[i][xid].value(); data[i - 1].y = table_[i][yid].value(); data[i - 1].z = table_[i][zid].value(); } return; } void gctl::geodsv_io::get_column_point3dc(array &data, std::string xname, std::string yname, std::string zname) { get_column_point3dc(data, name_index(xname, false), name_index(yname, false), name_index(zname, false)); return; }