91超碰碰碰碰久久久久久综合_超碰av人澡人澡人澡人澡人掠_国产黄大片在线观看画质优化_txt小说免费全本

溫馨提示×

溫馨提示×

您好,登錄后才能下訂單哦!

密碼登錄×
登錄注冊×
其他方式登錄
點擊 登錄注冊 即表示同意《億速云用戶服務條款》

C++ Strassen算法代碼的實現

發布時間:2020-10-19 23:43:18 來源:腳本之家 閱讀:299 作者:Shiroha 欄目:編程語言

本文僅代碼,無理論解釋

實話實說,我覺得這個算法在C系列的語言下,簡直垃圾到爆炸……畢竟是一群完全不懂程序數學家對著紙弄出來的,看起來好像非常的有用,實際上耗時是非常爆炸的。

但是《算法導論》里有啊……然后上課又要求手寫一個

于是我就手寫了一個……我盡可能的減少使用的空間同時加快速度了,當 n = 512 的時候,內存使用量峰值沒有超過 10mb,而且是通過遞歸實現 Strassen 算法

其中,in.txt 已經預先準備了 3000000 個范圍在 0-100 隨機數,避免程序在運算過程中爆 int(雖然完全可以取1000)

/**
 * Created by Mauve on 3/29/2020.
 * Copyright © 2020 Mauve, All Rights Reserved
 */

#include <bits/stdc++.h>

using namespace std;

/**
 * 矩陣相乘
 * 最終結果耗時結果保存至
 * https://www.desmos.com/calculator/gl4tm5i1zu
 */

struct mat {
  unsigned row, col;

  mat(unsigned r, unsigned c) : row(r), col(c) {}

  virtual int &pos_ref(unsigned i, unsigned j) = 0;

  virtual int pos(unsigned i, unsigned j) const = 0;
};

struct base_mat;
struct sub_mat;

stack<sub_mat *> sub_data;

struct base_mat : mat {
  int *data;

  base_mat(unsigned r, unsigned c) : mat(r, c), data(new int[row * col]) {}

  ~base_mat() {
    delete[] data;
  }

  inline int &pos_ref(unsigned i, unsigned j) override {
    return *(data + i * col + j);
  }

  inline int pos(unsigned i, unsigned j) const override {
    return *(data + i * col + j);
  }
};

unsigned min_mul;

struct sub_mat : mat {
  mat *a, *b;
  bool is_add;
  unsigned offset_ai, offset_aj, offset_bi, offset_bj;

  explicit sub_mat(mat *data) : mat(data->row, data->col), a(data), b(nullptr),
                 is_add(false), offset_ai(0), offset_aj(0),
                 offset_bi(0), offset_bj(0) { sub_data.push(this); }

  sub_mat(mat *data, bool of_i, bool of_j) : mat(data->row >> 1u, data->col >> 1u), a(data), b(nullptr),
                        is_add(false), offset_ai(of_i ? data->row >> 1u : 0),
                        offset_aj(of_j ? data->col >> 1u : 0),
                        offset_bi(0), offset_bj(0) { sub_data.push(this); }

  inline int &pos_ref(unsigned i, unsigned j) override {
    assert(b == nullptr);
    return a->pos_ref(i + offset_ai, j + offset_aj);
  }

  inline int pos(unsigned i, unsigned j) const override {
    if (b == nullptr)
      return a->pos(i + offset_ai, j + offset_aj);
    return a->pos(i + offset_ai, j + offset_aj) + (is_add ? 1 : -1) * b->pos(i + offset_bi, j + offset_bj);
  }

  inline sub_mat *operator+(sub_mat &other) {
    auto res = new sub_mat(this);
    res->b = &other;
    res->is_add = true;
    return res;
  }

  inline sub_mat *operator-(sub_mat &other) {
    auto res = new sub_mat(this);
    res->b = &other;
    res->is_add = false;
    return res;
  }

  mat *operator*(sub_mat &other) {
    assert(col == other.row);
    auto res = new base_mat(row, other.col);
    if (col & 1u || row & 1u || col <= min_mul || row <= min_mul || other.col <= min_mul) {
      memset(res->data, 0, sizeof(int) * res->row * res->col);
      for (int k = 0; k < col; k++)
        for (int i = 0; i < row; ++i)
          for (int j = 0; j < other.col; ++j)
            res->pos_ref(i, j) += pos(i, k) * other.pos(k, j);
    } else {
      size_t sub_data_size = sub_data.size();
#define a(i, j) (*new sub_mat(this, i == 2 , j == 2))
#define b(i, j) (*new sub_mat(&other, i == 2 , j == 2))
      auto m1 = *(a(1, 1) + a(2, 2)) * *(b(1, 1) + b (2, 2));
      auto m2 = *(a(2, 1) + a(2, 2)) * b(1, 1);
      auto m3 = a(1, 1) * *(b(1, 2) - b(2, 2));
      auto m4 = a(2, 2) * *(b(2, 1) - b(1, 1));
      auto m5 = *(a(1, 1) + a(1, 2)) * b(2, 2);
      auto m6 = *(a(2, 1) - a(1, 1)) * *(b(1, 1) + b(1, 2));
      auto m7 = *(a(1, 2) - a(2, 2)) * *(b(2, 1) + b(2, 2));
#undef a
#undef b
      unsigned half_row = row >> 1u, half_col = col >> 1u;
#define m(t) (m##t->pos(i, j))
      // C11
      for (unsigned i = 0; i < half_row; ++i)
        for (unsigned j = 0; j < half_col; ++j)
          res->pos_ref(i, j) = m(1) + m(4) - m(5) + m(7);
      // C12
      for (unsigned i = 0; i < half_row; ++i)
        for (unsigned j = 0; j < half_col; ++j)
          res->pos_ref(i, j + half_col) = m(3) + m(5);
      // C21
      for (unsigned i = 0; i < half_row; ++i)
        for (unsigned j = 0; j < half_col; ++j)
          res->pos_ref(i + half_row, j) = m(2) + m(4);
      // C22
      for (unsigned i = 0; i < half_row; ++i)
        for (unsigned j = 0; j < half_col; ++j)
          res->pos_ref(i + half_row, j + half_col) = m(1) - m(2) + m(3) + m(6);
#undef m
      delete dynamic_cast<base_mat *>(m1);
      delete dynamic_cast<base_mat *>(m2);
      delete dynamic_cast<base_mat *>(m3);
      delete dynamic_cast<base_mat *>(m4);
      delete dynamic_cast<base_mat *>(m5);
      delete dynamic_cast<base_mat *>(m6);
      delete dynamic_cast<base_mat *>(m7);
      while (sub_data.size() > sub_data_size) {
        delete sub_data.top();
        sub_data.pop();
      }
    }
    return res;
  }
};

unsigned N = 2;

void solve() {
  cerr << "N = " << N << endl;
  base_mat a(N, N), b(N, N);
  for (int i = 0; i < N; ++i)
    for (int j = 0; j < N; ++j)
      cin >> a.pos_ref(i, j);
  for (int i = 0; i < N; ++i)
    for (int j = 0; j < N; ++j)
      cin >> b.pos_ref(i, j);

  for (int t = 1; t < min(10u, N); t += 3) {
    auto x = new sub_mat(&a), y = new sub_mat(&b);
    min_mul = t;

    auto time_1 = clock();
    auto z = *x * *y;
    auto time_2 = clock();

    cerr << "t = " << t << " time: " << double(time_2 - time_1) / CLOCKS_PER_SEC << endl;
    delete dynamic_cast<base_mat *>(z);
    while (!sub_data.empty()) {
      delete sub_data.top();
      sub_data.pop();
    }
  }

  auto x = new sub_mat(&a), y = new sub_mat(&b);
  min_mul = 10000;

  auto time_1 = clock();
  auto z = *x * *y;
  auto time_2 = clock();

  cerr << "tradition: " << double(time_2 - time_1) / CLOCKS_PER_SEC << endl;
  delete dynamic_cast<base_mat *>(z);
  while (!sub_data.empty()) {
    delete sub_data.top();
    sub_data.pop();
  }
  N *= 2;
  if (N >= 1000) exit(0);
}

signed main() {
  ios_base::sync_with_stdio(false);
  cin.tie(nullptr);
  cout.tie(nullptr);
#ifdef ACM_LOCAL
  freopen("in.txt", "r", stdin);
  freopen("out.txt", "w", stdout);
  long long test_index_for_debug = 1;
  char acm_local_for_debug;
  while (cin >> acm_local_for_debug && acm_local_for_debug != '~') {
    cin.putback(acm_local_for_debug);
    if (test_index_for_debug > 20) {
      throw runtime_error("Check the stdin!!!");
    }
    auto start_clock_for_debug = clock();
    solve();
    auto end_clock_for_debug = clock();
    cout << "Test " << test_index_for_debug << " successful" << endl;
    cerr << "Test " << test_index_for_debug++ << " Run Time: "
       << double(end_clock_for_debug - start_clock_for_debug) / CLOCKS_PER_SEC << "s" << endl;
    cout << "--------------------------------------------------" << endl;
  }
#else
  solve();
#endif
  return 0;
}

到此這篇關于C++ Strassen算法代碼的實現的文章就介紹到這了,更多相關C++ Strassen算法 內容請搜索億速云以前的文章或繼續瀏覽下面的相關文章希望大家以后多多支持億速云!

向AI問一下細節

免責聲明:本站發布的內容(圖片、視頻和文字)以原創、轉載和分享為主,文章觀點不代表本網站立場,如果涉及侵權請聯系站長郵箱:is@yisu.com進行舉報,并提供相關證據,一經查實,將立刻刪除涉嫌侵權內容。

AI

万宁市| 邯郸市| 中阳县| 襄垣县| 昌平区| 洞头县| 泊头市| 兰考县| 沁源县| 修武县| 平原县| 福贡县| 胶南市| 丹阳市| 方城县| 葫芦岛市| 巨野县| 大邑县| 维西| 东海县| 乌鲁木齐县| 都江堰市| 德钦县| 额敏县| 芦溪县| 喀喇沁旗| 博客| 虞城县| 潍坊市| 普兰县| 大渡口区| 分宜县| 阿拉尔市| 湘阴县| 新乡市| 南溪县| 资中县| 富源县| 金秀| 简阳市| 平邑县|