#include<bits/stdc++.h>
using namespace std;
static struct FastInput {
static constexpr int BUF_SIZE = 1 << 20;
char buf[BUF_SIZE];
size_t chars_read = 0;
size_t buf_pos = 0;
FILE *in = stdin;
char cur = 0;
inline char get_char() {
if (buf_pos >= chars_read) {
chars_read = fread(buf, 1, BUF_SIZE, in);
buf_pos = 0;
buf[0] = (chars_read == 0 ? -1 : buf[0]);
}
return cur = buf[buf_pos++];
}
inline void tie(int) {}
inline explicit operator bool() {
return cur != -1;
}
inline static bool is_blank(char c) {
return c <= ' ';
}
inline bool skip_blanks() {
while (is_blank(cur) && cur != -1) {
get_char();
}
return cur != -1;
}
inline FastInput& operator>>(char& c) {
skip_blanks();
c = cur;
return *this;
}
inline FastInput& operator>>(string& s) {
if (skip_blanks()) {
s.clear();
do {
s += cur;
} while (!is_blank(get_char()));
}
return *this;
}
template <typename T>
inline FastInput& read_integer(T& n) {
// unsafe, doesn't check that characters are actually digits
n = 0;
if (skip_blanks()) {
int sign = +1;
if (cur == '-') {
sign = -1;
get_char();
}
do {
n += n + (n << 3) + cur - '0';
} while (!is_blank(get_char()));
n *= sign;
}
return *this;
}
template <typename T>
inline typename enable_if<is_integral<T>::value, FastInput&>::type operator>>(T& n) {
return read_integer(n);
}
#if !defined(_WIN32) || defined(_WIN64)
inline FastInput& operator>>(__int128& n) {
return read_integer(n);
}
#endif
template <typename T>
inline typename enable_if<is_floating_point<T>::value, FastInput&>::type operator>>(T& n) {
// not sure if really fast, for compatibility only
n = 0;
if (skip_blanks()) {
string s;
(*this) >> s;
sscanf(s.c_str(), "%lf", &n);
}
return *this;
}
} fast_input;
#define cin fast_input
#define ii pair<int,int>
#define fi first
#define se second
//#define int long long
#define FOR(i, a, b) for(int i = (a); i <= (b); i++)
#define ll long long
#define ld double
#define mp make_pair
#define lg2 30
#define iii pair<int,ii>
#define iiii pair<ii,ii>
#define base 29
#define eps 1e-8
#define MASK(i) (1LL << (i))
#define BIT(S, i) (((S) >> (i)) & 1)
int dx[]= {0LL,0LL,1,-1,1,1,-1,-1};
int dy[]= {1,-1,0LL,0LL,1,-1,1,-1};
const int maxn=1e5+1,S=600,size_S=maxn/S+2;
const int mod=1e9+7;
struct FEN
{
int n;
ll bit1[S+1],bit2[S+1];
FEN() {};
FEN(int _n):n(_n+1)
{
};
ll get(ll bit[] ,int r)
{
ll ret = 0;
for (; r > 0; r = (r & (r + 1)) - 1)
ret += bit[r];
return ret;
}
void update(ll bit[],int idx, int delta)
{
for (; idx < n; idx = idx | (idx + 1))
bit[idx] += delta;
}
void updateRange(int l, int r, int v)
{
update(bit1, l, (n - l + 1) * v);
update(bit1, r + 1,-(n - r) * v);
update(bit2, l, v);
update(bit2, r + 1, -v);
}
ll pre(int u)
{
return get(bit1, u) - get(bit2, u) *1LL* (n - u);
}
ll getRange(int l, int r)
{
if(l>r)return 0;
return pre(r) - (l == 1 ? 0 : pre(l - 1));
}
} bit[size_S];
int n,L[size_S],R[size_S],q,pos[maxn],p[maxn],cnt,id[maxn];
ll lazy[size_S];
vector<int> nen[size_S];
struct Query {
int type, l, r, x;
} Q[maxn];
struct SegmentTree {
int n;
vector<ll> node, lazy;
SegmentTree(int n = 0): n(n), node((n << 2) + 5, 0), lazy((n << 2) + 5, 0) {}
void pushDown(int id, int l, int r) {
ll &t = lazy[id];
if (t) {
int mid = (l + r) >> 1;
node[id << 1] += t * (mid - l + 1);
node[id << 1 | 1] += t * (r - mid);
lazy[id << 1] += t;
lazy[id << 1 | 1] += t;
t = 0;
}
}
void update(int id, int l, int r, int u, int v, int k) {
if (l > v || r < u) return;
if (u <= l && r <= v) {
node[id] += 1LL * (r - l + 1) * k;
lazy[id] += k;
return;
}
pushDown(id, l, r);
int mid = (l + r) >> 1;
update(id << 1, l, mid, u, v, k);
update(id << 1 | 1, mid + 1, r, u, v, k);
node[id] = node[id << 1] + node[id << 1 | 1];
}
ll getSum(int id, int l, int r, int u, int v) {
if (l > v || r < u) return 0;
if (u <= l && r <= v) return node[id];
pushDown(id, l, r);
int mid = (l + r) >> 1;
return getSum(id << 1, l, mid, u, v) + getSum(id << 1 | 1, mid + 1, r, u, v);
}
} IT;
namespace Subtask2 {
bool check() {
FOR(i, 1, q) if (Q[i].type != 1 && Q[i].type != 3)
return false;
return true;
}
void solve() {
IT = SegmentTree(n);
FOR(i, 1, q) {
if (Q[i].type == 1) IT.update(1, 1, n, Q[i].l, Q[i].r, Q[i].x);
else cout << IT.getSum(1, 1, n, Q[i].l, Q[i].r) << '\n';
}
}
}
void solve0(int l,int r,int w)
{
int x=id[l],y=id[r];
if(x==y)
{
for(int i=l; i<=r; i++)
{
bit[x].updateRange(pos[i],pos[i],w);
}
return;
}
for(int i=x+1; i<=y-1; i++)
{
lazy[i]+=w;
}
if(R[x]-l+1<=l-1-L[x]+1)
for(int i=l; i<=R[x]; i++)
{
bit[x].updateRange(pos[i],pos[i],w);
}
else
{
lazy[x]+=w;
for(int i=L[x];i<=l-1;i++)
bit[x].updateRange(pos[i],pos[i],-w);
}
if(r-L[y]+1<=R[y]-(r+1)+1)
for(int i=L[y]; i<=r; i++)
{
bit[y].updateRange(pos[i],pos[i],w);
}
else
{
lazy[y]+=w;
for(int i=r+1;i<=R[y];i++)
bit[y].updateRange(pos[i],pos[i],-w);
}
}
void solve1(int l,int r,int w)
{
for(int i=1;i<=cnt;i++)
{
int u=lower_bound(nen[i].begin(),nen[i].end(),l)-nen[i].begin()+1,
v= (r >= nen[i].back() ? nen[i].size() : upper_bound(nen[i].begin()+u-1,nen[i].end(),r)-nen[i].begin());
if(u>v)continue;
if(v-u+1==R[i]-L[i]+1)
lazy[i]+=w;
else
bit[i].updateRange(u,v,w);
}
}
void solve2(int l,int r)
{
int x=id[l],y=id[r];
ll ans=0;
if(x==y)
{
for(int i=l; i<=r; i++)
{
ans+=bit[x].getRange(pos[i],pos[i]);
}
ans+=1LL*(r-l+1)*lazy[x];
cout<<ans<<'\n';
return;
}
for(int i=x+1; i<=y-1; i++)
{
ans+=bit[i].getRange(1,R[i]-L[i]+1)+(R[i]-L[i]+1)*lazy[i];
}
for(int i=l; i<=R[x]; i++)
{
ans+=bit[x].getRange(pos[i],pos[i]);
}
ans+=1LL*(R[x]-l+1)*lazy[x];
for(int i=L[y]; i<=r; i++)
{
ans+=bit[y].getRange(pos[i],pos[i]);
}
ans+=1LL*(r-L[y]+1)*lazy[y];
cout<<ans<<'\n';
}
void solve3(int l,int r)
{
ll ans=0;
for(int i=1;i<=cnt;i++)
{
int u=lower_bound(nen[i].begin(),nen[i].end(),l)-nen[i].begin()+1,
v= (r >= nen[i].back() ? nen[i].size() : upper_bound(nen[i].begin()+u-1,nen[i].end(),r)-nen[i].begin());
ans+=bit[i].getRange(u,v)+1LL*(v-u+1)*lazy[i];
}
cout<<ans<<'\n';
}
signed main()
{
ios_base::sync_with_stdio(0);
cin.tie(0);
cout.tie(0);
#define task "task"
if(fopen(task".inp","r"))
{
freopen(task".inp","r",stdin);
freopen(task".out","w",stdout);
}
cin>>n>>q;
for(int i=1; i<=n; i++)
{
cin>>p[i];
pos[p[i]]=i;
}
FOR(i, 1, q) {
cin >> Q[i].type >> Q[i].l >> Q[i].r;
if (Q[i].type <= 1) cin >> Q[i].x;
}
if (Subtask2 :: check()) {
Subtask2 :: solve();
return 0;
}
cnt=0;
for(int i=1; i<=n; i+=S)
{
cnt++;
L[cnt]=i;
R[cnt]=min(n,i+S-1);
bit[cnt]=FEN(R[cnt]-L[cnt]+1);
for(int j=i; j<=R[cnt]; j++)
{
id[j]=cnt;
nen[cnt].push_back(pos[j]);
}
sort(nen[cnt].begin(),nen[cnt].end());
int j=0;
for(int j=i;j<=R[cnt];j++)
{
pos[j]=lower_bound(nen[cnt].begin(),nen[cnt].end(),pos[j])-nen[cnt].begin()+1;
}
}
FOR(i, 1, q)
{
int t = Q[i].type;
if(t==0)
{
solve0(Q[i].l,Q[i].r,Q[i].x);
}
else if(t==1)
{
solve1(Q[i].l,Q[i].r,Q[i].x);
}
else if(t==2)
{
solve2(Q[i].l,Q[i].r);
}
else
{
solve3(Q[i].l,Q[i].r);
}
}
cerr <<endl<< "TIME : " << clock() * 0.001 << "s" << endl ;
}
#include<bits/stdc++.h>
using namespace std;
static struct FastInput {
  static constexpr int BUF_SIZE = 1 << 20;
  char buf[BUF_SIZE];
  size_t chars_read = 0;
  size_t buf_pos = 0;
  FILE *in = stdin;
  char cur = 0;

  inline char get_char() {
    if (buf_pos >= chars_read) {
      chars_read = fread(buf, 1, BUF_SIZE, in);
      buf_pos = 0;
      buf[0] = (chars_read == 0 ? -1 : buf[0]);
    }
    return cur = buf[buf_pos++];
  }

  inline void tie(int) {}

  inline explicit operator bool() {
    return cur != -1;
  }

  inline static bool is_blank(char c) {
    return c <= ' ';
  }

  inline bool skip_blanks() {
    while (is_blank(cur) && cur != -1) {
      get_char();
    }
    return cur != -1;
  }

  inline FastInput& operator>>(char& c) {
    skip_blanks();
    c = cur;
    return *this;
  }

  inline FastInput& operator>>(string& s) {
    if (skip_blanks()) {
      s.clear();
      do {
        s += cur;
      } while (!is_blank(get_char()));
    }
    return *this;
  }

  template <typename T>
  inline FastInput& read_integer(T& n) {
    // unsafe, doesn't check that characters are actually digits
    n = 0;
    if (skip_blanks()) {
      int sign = +1;
      if (cur == '-') {
        sign = -1;
        get_char();
      }
      do {
        n += n + (n << 3) + cur - '0';
      } while (!is_blank(get_char()));
      n *= sign;
    }
    return *this;
  }

  template <typename T>
  inline typename enable_if<is_integral<T>::value, FastInput&>::type operator>>(T& n) {
    return read_integer(n);
  }

  #if !defined(_WIN32) || defined(_WIN64)
  inline FastInput& operator>>(__int128& n) {
    return read_integer(n);
  }
  #endif

  template <typename T>
  inline typename enable_if<is_floating_point<T>::value, FastInput&>::type operator>>(T& n) {
    // not sure if really fast, for compatibility only
    n = 0;
    if (skip_blanks()) {
      string s;
      (*this) >> s;
      sscanf(s.c_str(), "%lf", &n);
    }
    return *this;
  }
} fast_input;

#define cin fast_input
#define ii pair<int,int>
#define fi first
#define se second
//#define int long long
#define FOR(i, a, b) for(int i = (a); i <= (b); i++)
#define ll long long
#define ld double
#define mp make_pair
#define lg2 30
#define iii pair<int,ii>
#define iiii pair<ii,ii>
#define base 29
#define eps 1e-8
#define MASK(i) (1LL << (i))
#define BIT(S, i) (((S) >> (i)) & 1)
int dx[]= {0LL,0LL,1,-1,1,1,-1,-1};
int dy[]= {1,-1,0LL,0LL,1,-1,1,-1};
const int maxn=1e5+1,S=600,size_S=maxn/S+2;
const int mod=1e9+7;

struct FEN
{
    int n;
    ll bit1[S+1],bit2[S+1];
    FEN() {};
    FEN(int _n):n(_n+1)
    {
    };
    ll get(ll bit[] ,int r)
    {
        ll ret = 0;
        for (; r > 0; r = (r & (r + 1)) - 1)
            ret += bit[r];
        return ret;
    }
    void update(ll bit[],int idx, int delta)
    {
        for (; idx < n; idx = idx | (idx + 1))
            bit[idx] += delta;
    }
    void updateRange(int l, int r, int v)
    {
        update(bit1, l, (n - l + 1) * v);
        update(bit1, r + 1,-(n - r) * v);
        update(bit2, l, v);
        update(bit2, r + 1, -v);
    }
    ll pre(int u)
    {
        return get(bit1, u) - get(bit2, u) *1LL* (n - u);
    }

    ll getRange(int l, int r)
    {
        if(l>r)return 0;
        return pre(r) - (l == 1 ? 0 : pre(l - 1));
    }
} bit[size_S];
int n,L[size_S],R[size_S],q,pos[maxn],p[maxn],cnt,id[maxn];
ll lazy[size_S];
vector<int> nen[size_S];

struct Query {
    int type, l, r, x;
} Q[maxn];

struct SegmentTree {
    int n;
    vector<ll> node, lazy;

    SegmentTree(int n = 0): n(n), node((n << 2) + 5, 0), lazy((n << 2) + 5, 0) {}

    void pushDown(int id, int l, int r) {
        ll &t = lazy[id];
        if (t) {
            int mid = (l + r) >> 1;
            node[id << 1] += t * (mid - l + 1);
            node[id << 1 | 1] += t * (r - mid);
            lazy[id << 1] += t;
            lazy[id << 1 | 1] += t;
            t = 0;
        }
    }

    void update(int id, int l, int r, int u, int v, int k) {
        if (l > v || r < u) return;
        if (u <= l && r <= v) {
            node[id] += 1LL * (r - l + 1) * k;
            lazy[id] += k;
            return;
        }
        pushDown(id, l, r);
        int mid = (l + r) >> 1;
        update(id << 1, l, mid, u, v, k);
        update(id << 1 | 1, mid + 1, r, u, v, k);
        node[id] = node[id << 1] + node[id << 1 | 1];
    }

    ll getSum(int id, int l, int r, int u, int v) {
        if (l > v || r < u) return 0;
        if (u <= l && r <= v) return node[id];
        pushDown(id, l, r);
        int mid = (l + r) >> 1;
        return getSum(id << 1, l, mid, u, v) + getSum(id << 1 | 1, mid + 1, r, u, v);
    }
} IT;

namespace Subtask2 {
    bool check() {
        FOR(i, 1, q) if (Q[i].type != 1 && Q[i].type != 3)
            return false;
        return true;
    }

    void solve() {
		IT = SegmentTree(n);
        FOR(i, 1, q) {
            if (Q[i].type == 1) IT.update(1, 1, n, Q[i].l, Q[i].r, Q[i].x);
            else cout << IT.getSum(1, 1, n, Q[i].l, Q[i].r) << '\n';
        }
    }
}


void solve0(int l,int r,int w)
{
    int x=id[l],y=id[r];
    if(x==y)
    {
        for(int i=l; i<=r; i++)
        {
            bit[x].updateRange(pos[i],pos[i],w);
        }
        return;
    }
    for(int i=x+1; i<=y-1; i++)
    {
        lazy[i]+=w;
    }
    if(R[x]-l+1<=l-1-L[x]+1)
    for(int i=l; i<=R[x]; i++)
    {
        bit[x].updateRange(pos[i],pos[i],w);
    }
    else
    {
        lazy[x]+=w;
        for(int i=L[x];i<=l-1;i++)
        bit[x].updateRange(pos[i],pos[i],-w);
    }
    if(r-L[y]+1<=R[y]-(r+1)+1)
    for(int i=L[y]; i<=r; i++)
    {
        bit[y].updateRange(pos[i],pos[i],w);
    }
    else
    {
        lazy[y]+=w;
        for(int i=r+1;i<=R[y];i++)
        bit[y].updateRange(pos[i],pos[i],-w);
    }
}
void solve1(int l,int r,int w)
{
    for(int i=1;i<=cnt;i++)
    {
        int u=lower_bound(nen[i].begin(),nen[i].end(),l)-nen[i].begin()+1,
            v= (r >= nen[i].back() ? nen[i].size() : upper_bound(nen[i].begin()+u-1,nen[i].end(),r)-nen[i].begin());
            if(u>v)continue;
            if(v-u+1==R[i]-L[i]+1)
            lazy[i]+=w;
           else
            bit[i].updateRange(u,v,w);
    }
}
void solve2(int l,int r)
{
    int x=id[l],y=id[r];
    ll ans=0;
    if(x==y)
    {
        for(int i=l; i<=r; i++)
        {
            ans+=bit[x].getRange(pos[i],pos[i]);
        }
        ans+=1LL*(r-l+1)*lazy[x];
        cout<<ans<<'\n';
        return;
    }
    for(int i=x+1; i<=y-1; i++)
    {
        ans+=bit[i].getRange(1,R[i]-L[i]+1)+(R[i]-L[i]+1)*lazy[i];
    }
    for(int i=l; i<=R[x]; i++)
    {
        ans+=bit[x].getRange(pos[i],pos[i]);
    }
    ans+=1LL*(R[x]-l+1)*lazy[x];
    for(int i=L[y]; i<=r; i++)
    {
        ans+=bit[y].getRange(pos[i],pos[i]);
    }
    ans+=1LL*(r-L[y]+1)*lazy[y];
    cout<<ans<<'\n';
}
void solve3(int l,int r)
{
    ll ans=0;
    for(int i=1;i<=cnt;i++)
    {
        int u=lower_bound(nen[i].begin(),nen[i].end(),l)-nen[i].begin()+1,
            v= (r >= nen[i].back() ? nen[i].size() : upper_bound(nen[i].begin()+u-1,nen[i].end(),r)-nen[i].begin());
            ans+=bit[i].getRange(u,v)+1LL*(v-u+1)*lazy[i];
    }
    cout<<ans<<'\n';
}
signed main()
{
    ios_base::sync_with_stdio(0);
    cin.tie(0);
    cout.tie(0);
#define task "task"
    if(fopen(task".inp","r"))
    {
        freopen(task".inp","r",stdin);
        freopen(task".out","w",stdout);
    }
    cin>>n>>q;
    for(int i=1; i<=n; i++)
    {
         cin>>p[i];
         pos[p[i]]=i;
    }
    FOR(i, 1, q) {
        cin >> Q[i].type >> Q[i].l >> Q[i].r;
        if (Q[i].type <= 1) cin >> Q[i].x;
    }
    if (Subtask2 :: check()) {
        Subtask2 :: solve();
        return 0;
    }
    cnt=0;
    for(int i=1; i<=n; i+=S)
    {
        cnt++;
        L[cnt]=i;
        R[cnt]=min(n,i+S-1);
        bit[cnt]=FEN(R[cnt]-L[cnt]+1);
        for(int j=i; j<=R[cnt]; j++)
        {
            id[j]=cnt;
            nen[cnt].push_back(pos[j]);
        }
        sort(nen[cnt].begin(),nen[cnt].end());
        int j=0;
        for(int j=i;j<=R[cnt];j++)
        {
            pos[j]=lower_bound(nen[cnt].begin(),nen[cnt].end(),pos[j])-nen[cnt].begin()+1;
        }
    }
FOR(i, 1, q)
    {
        int t = Q[i].type;
        if(t==0)
        {
            solve0(Q[i].l,Q[i].r,Q[i].x);
        }
        else if(t==1)
        {
            solve1(Q[i].l,Q[i].r,Q[i].x);
        }
        else if(t==2)
        {
            solve2(Q[i].l,Q[i].r);
        }
        else
        {
            solve3(Q[i].l,Q[i].r);
        }
    }
    cerr <<endl<< "TIME : " << clock() * 0.001 << "s" << endl ;
}