// #define _CRT_SECURE_NO_WARNINGS
#include <iostream>
#include <algorithm>
#include <cmath>
#include <climits>
#include <vector>
#include <queue>
#include <deque>
#include <array>
#include <list>
#include <stack>
#include <tuple>
#include <set>
#include <unordered_set>
#include <map>
#include <unordered_map>
#include <string>
#include <cstring>
#include <random>
#include <bitset>
#include <iomanip>
#include <iterator>
#include <functional>
#include <ctime>
#include <chrono>
#include <cctype>
#include <fstream>
#include <numeric>
#include <complex>
#include <cassert>
using namespace std;
// #pragma GCC optimize("Ofast")
// #pragma GCC target("avx2,bmi,bmi2,lzcnt,popcnt")
#define int long long
#define sz(x) ((int)(x).size())
#define mp make_pair
#define all(x) (x).begin(), (x).end()
#define pb push_back
#define pf push_front
#define ff first
#define ss second
#define unique(x) (x).erase(unique(all(x)), (x).end())
#define min3(a, b, c) min(a, min(b, c))
#define max3(a, b, c) max(a, max(b, c))
#define FOR(i, a, b) for (int i = (a); i <= (b); i++)
#define ROF(i, a, b) for (int i = (a); i >= (b); i--)
using vi = vector<int>;
using vd = vector<double>;
using vpii = vector<pair<int, int>>;
using vpdd = vector<pair<double, double>>;
using pii = pair<int, int>;
using pdd = pair<double, double>;
// #include <ext/pb_ds/assoc_container.hpp>
// #include <ext/pb_ds/tree_policy.hpp>
// using namespace __gnu_pbds;
// typedef tree<int, null_type, less<int>, rb_tree_tag, tree_order_statistics_node_update> ordered_set;
template<typename T> using min_heap = priority_queue<T, vector<T>, greater<T>>;
template<typename T> using max_heap = priority_queue<T>;
#define BIT(n) (1LL << (n))
#define HAS_BIT(x, n) (((x) >> (n)) & 1)
#define SET_BIT(x, n) ((x) | BIT(n))
template <typename Container>
void PRINT(const Container& container) {
for (const auto& e : container) {
cout << e << ' ';
} cout << '\n';
}
void print_double(double ans, int num) {
cout << fixed << setprecision(num) << ans << '\n';
}
const int inf = 1e18;
const double eps = 1e-9;
const double PI = 3.141592653589793;
string alh = "abcdefghijklmnopqrstuvwxyz";
string ALH = "ABCDEFGHIJKLMNOPQRSTUVWXYZ";
class TP {
private:
vector<vector<int>> c;
vector<int> s;
vector<int> d;
int m, n;
vector<pair<int, int>> findCyc(vector<vector<int>>& sol, int si, int sj) {
int tot = m + n;
vector<int> par(tot, -1);
vector<bool> vis(tot, false);
queue<int> q;
vis[si] = true;
q.push(si);
int tar = sj + m;
while (!q.empty()) {
int node = q.front();
q.pop();
if (node < m) {
int i = node;
for (int j = 0; j < n; j++) {
if (sol[i][j] > 0) {
int cn = j + m;
if (!vis[cn]) {
vis[cn] = true;
par[cn] = node;
q.push(cn);
if (cn == tar) {
vector<int> path;
int cur = cn;
while (cur != -1) {
path.push_back(cur);
cur = par[cur];
}
reverse(path.begin(), path.end());
vector<pair<int, int>> cyc;
cyc.push_back({ si, sj });
for (int idx = 0; idx < path.size() - 1; idx++) {
int n1 = path[idx];
int n2 = path[idx + 1];
if (n1 < m && n2 >= m) {
cyc.push_back({ n1, n2 - m });
}
else if (n1 >= m && n2 < m) {
cyc.push_back({ n2, n1 - m });
}
}
return cyc;
}
}
}
}
}
else {
int j = node - m;
for (int i = 0; i < m; i++) {
if (sol[i][j] > 0) {
int rn = i;
if (!vis[rn]) {
vis[rn] = true;
par[rn] = node;
q.push(rn);
}
}
}
}
}
return {};
}
void redist(vector<vector<int>>& sol, vector<pair<int, int>>& cyc) {
if (cyc.size() < 4) return;
int theta = INT_MAX;
for (int i = 1; i < cyc.size(); i += 2) {
int x = cyc[i].first, y = cyc[i].second;
if (sol[x][y] < theta) {
theta = sol[x][y];
}
}
for (int i = 0; i < cyc.size(); i++) {
int x = cyc[i].first, y = cyc[i].second;
if (i % 2 == 0) {
sol[x][y] += theta;
}
else {
sol[x][y] -= theta;
}
}
}
public:
TP(vector<vector<int>> c, vector<int> s, vector<int> d)
: c(c), s(s), d(d) {
m = s.size();
n = d.size();
}
vector<vector<int>> NW() {
vector<vector<int>> sol(m, vector<int>(n, 0));
vector<int> sup = s, dem = d;
int i = 0, j = 0;
while (i < m && j < n) {
int amt = min(sup[i], dem[j]);
sol[i][j] = amt;
sup[i] -= amt;
dem[j] -= amt;
if (sup[i] == 0) i++;
if (dem[j] == 0) j++;
}
return sol;
}
vector<vector<int>> solve() {
auto sol = NW();
int iter = 0;
const int MAX_ITER = 100;
while (iter++ < MAX_ITER) {
vector<int> u(m, INT_MAX), v(n, INT_MAX);
u[0] = 0;
bool ch;
do {
ch = false;
for (int i = 0; i < m; i++) {
for (int j = 0; j < n; j++) {
if (sol[i][j] > 0) {
if (u[i] != INT_MAX && v[j] == INT_MAX) {
v[j] = c[i][j] - u[i];
ch = true;
}
else if (v[j] != INT_MAX && u[i] == INT_MAX) {
u[i] = c[i][j] - v[j];
ch = true;
}
}
}
}
} while (ch);
int minD = 0;
int bestI = -1, bestJ = -1;
for (int i = 0; i < m; i++) {
for (int j = 0; j < n; j++) {
if (sol[i][j] == 0) {
if (u[i] == INT_MAX || v[j] == INT_MAX) continue;
int delta = c[i][j] - (u[i] + v[j]);
if (delta < minD) {
minD = delta;
bestI = i;
bestJ = j;
}
}
}
}
if (minD >= 0) break;
auto cyc = findCyc(sol, bestI, bestJ);
if (cyc.empty()) {
cout << "Cycle not found for cell (" << bestI << "," << bestJ << ")" << endl;
break;
}
redist(sol, cyc);
}
return sol;
}
int calcCost(const vector<vector<int>>& sol) {
int tot = 0;
for (int i = 0; i < m; i++) {
for (int j = 0; j < n; j++) {
tot += sol[i][j] * c[i][j];
}
}
return tot;
}
void printSol(const vector<vector<int>>& sol) {
cout << " ";
for (int j = 0; j < n; j++) cout << setw(3) << "B" << j + 1;
cout << setw(6) << "Sup" << endl;
for (int i = 0; i < m; i++) {
cout << "A" << i + 1 << " ";
int rs = 0;
for (int j = 0; j < n; j++) {
cout << setw(4) << sol[i][j];
rs += sol[i][j];
}
cout << setw(6) << rs << endl;
}
cout << "Dem ";
for (int j = 0; j < n; j++) {
int cs = 0;
for (int i = 0; i < m; i++) {
cs += sol[i][j];
}
cout << setw(4) << cs;
}
cout << endl;
}
};
void Solve() {
vector<int> s = { 120, 90, 150 };
vector<int> d = { 50, 60, 40, 70, 30, 20, 90 };
vector<vector<int>> c = {
{4, 7, 2, 5, 8, 3, 6},
{9, 1, 6, 4, 2, 7, 5},
{3, 8, 5, 9, 1, 4, 2}
};
TP tp(c, s, d);
auto nw = tp.NW();
int nwCost = tp.calcCost(nw);
cout << "North-West corner cost: " << nwCost << endl;
auto opt = tp.solve();
int optCost = tp.calcCost(opt);
cout << "Optimal solution cost: " << optCost << endl;
tp.printSol(opt);
bool ok = true;
for (int i = 0; i < s.size(); i++) {
int rs = 0;
for (int j = 0; j < d.size(); j++) {
rs += opt[i][j];
}
if (rs != s[i]) {
cout << "R " << i << " error: " << rs << " != " << s[i] << endl;
ok = false;
}
}
for (int j = 0; j < d.size(); j++) {
int cs = 0;
for (int i = 0; i < s.size(); i++) {
cs += opt[i][j];
}
if (cs != d[j]) {
cout << "C " << j << " error: " << cs << " != " << d[j] << endl;
ok = false;
}
}
}
signed main() {
ios_base::sync_with_stdio(false);
cin.tie(0);
cout.tie(0);
/*
________________
/ Just solved it \
| in my mind |
\________________/
/
/
/> フ ___________
| _ _| | |
/`ミ _x 彡 | WA 2 |
/ | |__________|
/ ヽ ノ / /
/ ̄| | | | /_________ /
| ( ̄ヽ__ヽ_)_)
\二つ
*/
/*
freopen("task.in", "r", stdin);
freopen("task.out", "w", stdout);
*/
// auto start = chrono::high_resolution_clock::now();
int multitest = false;
if (multitest == true) {
int ctt; cin >> ctt;
for (int i = 0; i < ctt; i++) {
Solve();
}
}
else {
Solve();
}
// auto end = chrono::high_resolution_clock::now();
/*
cout << "Time taken: "
<< chrono::duration_cast<chrono::milliseconds>(end - start).count()
<< " milliseconds" << endl;
*/
return 0;
}
// #define _CRT_SECURE_NO_WARNINGS 

#include <iostream> 
#include <algorithm> 
#include <cmath> 
#include <climits> 
#include <vector> 
#include <queue> 
#include <deque> 
#include <array> 
#include <list> 
#include <stack> 
#include <tuple> 
#include <set> 
#include <unordered_set> 
#include <map> 
#include <unordered_map> 
#include <string> 
#include <cstring> 
#include <random> 
#include <bitset> 
#include <iomanip> 
#include <iterator> 
#include <functional> 
#include <ctime> 
#include <chrono> 
#include <cctype> 
#include <fstream> 
#include <numeric> 
#include <complex> 
#include <cassert> 

using namespace std;

// #pragma GCC optimize("Ofast")
// #pragma GCC target("avx2,bmi,bmi2,lzcnt,popcnt")

#define int               long long 
#define sz(x)             ((int)(x).size()) 
#define mp                make_pair 
#define all(x)            (x).begin(), (x).end() 
#define pb                push_back 
#define pf                push_front 
#define ff                first 
#define ss                second 
#define unique(x)         (x).erase(unique(all(x)), (x).end()) 
#define min3(a, b, c)     min(a, min(b, c)) 
#define max3(a, b, c)     max(a, max(b, c)) 
#define FOR(i, a, b)      for (int i = (a); i <= (b); i++) 
#define ROF(i, a, b)      for (int i = (a); i >= (b); i--) 

using vi = vector<int>;
using vd = vector<double>;
using vpii = vector<pair<int, int>>;
using vpdd = vector<pair<double, double>>;
using pii = pair<int, int>;
using pdd = pair<double, double>;

// #include <ext/pb_ds/assoc_container.hpp>
// #include <ext/pb_ds/tree_policy.hpp>
// using namespace __gnu_pbds;
// typedef tree<int, null_type, less<int>, rb_tree_tag, tree_order_statistics_node_update> ordered_set;

template<typename T> using min_heap = priority_queue<T, vector<T>, greater<T>>;
template<typename T> using max_heap = priority_queue<T>;

#define BIT(n) (1LL << (n))
#define HAS_BIT(x, n) (((x) >> (n)) & 1)
#define SET_BIT(x, n) ((x) | BIT(n))

template <typename Container>
void PRINT(const Container& container) {
    for (const auto& e : container) {
        cout << e << ' ';
    } cout << '\n';
}

void print_double(double ans, int num) {
    cout << fixed << setprecision(num) << ans << '\n';
}

const int inf = 1e18;
const double eps = 1e-9;
const double PI = 3.141592653589793;

string alh = "abcdefghijklmnopqrstuvwxyz";
string ALH = "ABCDEFGHIJKLMNOPQRSTUVWXYZ";

class TP {
private:
    vector<vector<int>> c;
    vector<int> s;
    vector<int> d;
    int m, n;

    vector<pair<int, int>> findCyc(vector<vector<int>>& sol, int si, int sj) {
        int tot = m + n;
        vector<int> par(tot, -1);
        vector<bool> vis(tot, false);
        queue<int> q;

        vis[si] = true;
        q.push(si);
        int tar = sj + m;

        while (!q.empty()) {
            int node = q.front();
            q.pop();

            if (node < m) {
                int i = node;
                for (int j = 0; j < n; j++) {
                    if (sol[i][j] > 0) {
                        int cn = j + m;
                        if (!vis[cn]) {
                            vis[cn] = true;
                            par[cn] = node;
                            q.push(cn);
                            if (cn == tar) {
                                vector<int> path;
                                int cur = cn;
                                while (cur != -1) {
                                    path.push_back(cur);
                                    cur = par[cur];
                                }
                                reverse(path.begin(), path.end());

                                vector<pair<int, int>> cyc;
                                cyc.push_back({ si, sj });

                                for (int idx = 0; idx < path.size() - 1; idx++) {
                                    int n1 = path[idx];
                                    int n2 = path[idx + 1];
                                    if (n1 < m && n2 >= m) {
                                        cyc.push_back({ n1, n2 - m });
                                    }
                                    else if (n1 >= m && n2 < m) {
                                        cyc.push_back({ n2, n1 - m });
                                    }
                                }
                                return cyc;
                            }
                        }
                    }
                }
            }
            else {
                int j = node - m;
                for (int i = 0; i < m; i++) {
                    if (sol[i][j] > 0) {
                        int rn = i;
                        if (!vis[rn]) {
                            vis[rn] = true;
                            par[rn] = node;
                            q.push(rn);
                        }
                    }
                }
            }
        }
        return {};
    }

    void redist(vector<vector<int>>& sol, vector<pair<int, int>>& cyc) {
        if (cyc.size() < 4) return;

        int theta = INT_MAX;
        for (int i = 1; i < cyc.size(); i += 2) {
            int x = cyc[i].first, y = cyc[i].second;
            if (sol[x][y] < theta) {
                theta = sol[x][y];
            }
        }

        for (int i = 0; i < cyc.size(); i++) {
            int x = cyc[i].first, y = cyc[i].second;
            if (i % 2 == 0) {
                sol[x][y] += theta;
            }
            else {
                sol[x][y] -= theta;
            }
        }
    }

public:
    TP(vector<vector<int>> c, vector<int> s, vector<int> d)
        : c(c), s(s), d(d) {
        m = s.size();
        n = d.size();
    }

    vector<vector<int>> NW() {
        vector<vector<int>> sol(m, vector<int>(n, 0));
        vector<int> sup = s, dem = d;
        int i = 0, j = 0;

        while (i < m && j < n) {
            int amt = min(sup[i], dem[j]);
            sol[i][j] = amt;
            sup[i] -= amt;
            dem[j] -= amt;

            if (sup[i] == 0) i++;
            if (dem[j] == 0) j++;
        }
        return sol;
    }

    vector<vector<int>> solve() {
        auto sol = NW();
        int iter = 0;
        const int MAX_ITER = 100;

        while (iter++ < MAX_ITER) {
            vector<int> u(m, INT_MAX), v(n, INT_MAX);
            u[0] = 0;

            bool ch;
            do {
                ch = false;
                for (int i = 0; i < m; i++) {
                    for (int j = 0; j < n; j++) {
                        if (sol[i][j] > 0) {
                            if (u[i] != INT_MAX && v[j] == INT_MAX) {
                                v[j] = c[i][j] - u[i];
                                ch = true;
                            }
                            else if (v[j] != INT_MAX && u[i] == INT_MAX) {
                                u[i] = c[i][j] - v[j];
                                ch = true;
                            }
                        }
                    }
                }
            } while (ch);

            int minD = 0;
            int bestI = -1, bestJ = -1;

            for (int i = 0; i < m; i++) {
                for (int j = 0; j < n; j++) {
                    if (sol[i][j] == 0) {
                        if (u[i] == INT_MAX || v[j] == INT_MAX) continue;
                        int delta = c[i][j] - (u[i] + v[j]);
                        if (delta < minD) {
                            minD = delta;
                            bestI = i;
                            bestJ = j;
                        }
                    }
                }
            }

            if (minD >= 0) break;

            auto cyc = findCyc(sol, bestI, bestJ);
            if (cyc.empty()) {
                cout << "Cycle not found for cell (" << bestI << "," << bestJ << ")" << endl;
                break;
            }

            redist(sol, cyc);
        }

        return sol;
    }

    int calcCost(const vector<vector<int>>& sol) {
        int tot = 0;
        for (int i = 0; i < m; i++) {
            for (int j = 0; j < n; j++) {
                tot += sol[i][j] * c[i][j];
            }
        }
        return tot;
    }

    void printSol(const vector<vector<int>>& sol) {
        cout << "    ";
        for (int j = 0; j < n; j++) cout << setw(3) << "B" << j + 1;
        cout << setw(6) << "Sup" << endl;

        for (int i = 0; i < m; i++) {
            cout << "A" << i + 1 << "  ";
            int rs = 0;
            for (int j = 0; j < n; j++) {
                cout << setw(4) << sol[i][j];
                rs += sol[i][j];
            }
            cout << setw(6) << rs << endl;
        }

        cout << "Dem ";
        for (int j = 0; j < n; j++) {
            int cs = 0;
            for (int i = 0; i < m; i++) {
                cs += sol[i][j];
            }
            cout << setw(4) << cs;
        }
        cout << endl;
    }
};

void Solve() {
    vector<int> s = { 120, 90, 150 };
    vector<int> d = { 50, 60, 40, 70, 30, 20, 90 };
    vector<vector<int>> c = {
        {4, 7, 2, 5, 8, 3, 6},
        {9, 1, 6, 4, 2, 7, 5},
        {3, 8, 5, 9, 1, 4, 2}
    };

    TP tp(c, s, d);

    auto nw = tp.NW();
    int nwCost = tp.calcCost(nw);
    cout << "North-West corner cost: " << nwCost << endl;

    auto opt = tp.solve();
    int optCost = tp.calcCost(opt);
    cout << "Optimal solution cost: " << optCost << endl;

    tp.printSol(opt);

    bool ok = true;
    for (int i = 0; i < s.size(); i++) {
        int rs = 0;
        for (int j = 0; j < d.size(); j++) {
            rs += opt[i][j];
        }
        if (rs != s[i]) {
            cout << "R " << i << " error: " << rs << " != " << s[i] << endl;
            ok = false;
        }
    }

    for (int j = 0; j < d.size(); j++) {
        int cs = 0;
        for (int i = 0; i < s.size(); i++) {
            cs += opt[i][j];
        }
        if (cs != d[j]) {
            cout << "C " << j << " error: " << cs << " != " << d[j] << endl;
            ok = false;
        }
    }
}

signed main() {
    ios_base::sync_with_stdio(false);
    cin.tie(0);
    cout.tie(0);

    /*
                      ________________
                     / Just solved it \
                     |   in my mind   |
                     \________________/
                    /
                   /
　　　　　／＞　 フ         ___________
　　　　　| 　_　 _|       |          |
　 　　　／`ミ _x 彡       |   WA 2   |
　　 　 /　　　 　 |       |__________|
　　　 /　 ヽ　　 ﾉ        /          /
　／￣|　　 |　|　|       /_________ /
　| (￣ヽ＿_ヽ_)_)
　＼二つ

    */

    /*
    freopen("task.in", "r", stdin);
    freopen("task.out", "w", stdout);
    */

    // auto start = chrono::high_resolution_clock::now();

    int multitest = false;
    if (multitest == true) {
        int ctt; cin >> ctt;

        for (int i = 0; i < ctt; i++) {
            Solve();
        }
    }
    else {
        Solve();
    }

    // auto end = chrono::high_resolution_clock::now();

    /*
    cout << "Time taken: "
         << chrono::duration_cast<chrono::milliseconds>(end - start).count()
         << " milliseconds" << endl;
    */

    return 0;
}