%%javascript
IPython.OutputArea.prototype._should_scroll = function(lines) {
    return false;
}


import numpy as np
import pandas as pd
import sys
import os
import matplotlib.pyplot as plt
import plotly.graph_objects as go
import urllib.request

import gstlearn as gl
import gstlearn.plot as gp
import gstlearn.plot3D as gop


# Download the wells file (urlretrieve stores it in a local temporary file)
# and load it into a gstlearn Db using the default CSV format.
url = 'https://soft.minesparis.psl.eu/gstlearn/data/Chamaya/Wells.dat'
filepath, head = urllib.request.urlretrieve(url)
mydb = gl.Db.createFromCSV(filepath, gl.CSVformat())

# Flag columns "X" and "Y" with the coordinate locator.
mydb.setLocators(["X", "Y"], gl.ELoc.X)

# Notebook display of the data base summary.
mydb

Data Base Characteristics
=========================

Data Base Summary
-----------------
File is organized as a set of isolated points
Space dimension              = 2
Number of Columns            = 6
Total number of samples      = 189

Variables
---------
Column = 0 - Name = rank - Locator = NA
Column = 1 - Name = X - Locator = x1
Column = 2 - Name = Y - Locator = x2
Column = 3 - Name = top - Locator = NA
Column = 4 - Name = bot - Locator = NA
Column = 5 - Name = appraisal - Locator = NA


# Detailed print-out of the data base: the display format is built with all
# four flags switched on.
dbfmt = gl.DbStringFormat.createFromFlags(True, True, True, True)
mydb.display(dbfmt)

Data Base Characteristics
=========================

Data Base Summary
-----------------
File is organized as a set of isolated points
Space dimension              = 2
Number of Columns            = 6
Total number of samples      = 189

Data Base Extension
-------------------
Coor #1 - Min =     50.000 - Max =   9950.000 - Ext = 9900
Coor #2 - Min =    150.000 - Max =  14950.000 - Ext = 14800

Data Base Statistics
--------------------
1 - Name rank - Locator NA
 Nb of data          =        189
 Nb of active values =        189
 Minimum value       =      1.000
 Maximum value       =    189.000
 Mean value          =     95.000
 Standard Deviation  =     54.559
 Variance            =   2976.667
2 - Name X - Locator x1
 Nb of data          =        189
 Nb of active values =        189
 Minimum value       =     50.000
 Maximum value       =   9950.000
 Mean value          =   4893.386
 Standard Deviation  =   2909.303
 Variance            = 8464043.560
3 - Name Y - Locator x2
 Nb of data          =        189
 Nb of active values =        189
 Minimum value       =    150.000
 Maximum value       =  14950.000
 Mean value          =   8163.757
 Standard Deviation  =   4490.427
 Variance            = 20163937.740
4 - Name top - Locator NA
 Nb of data          =        189
 Nb of active values =        189
 Minimum value       =  -1030.760
 Maximum value       =   -983.260
 Mean value          =  -1007.963
 Standard Deviation  =     10.246
 Variance            =    104.980
5 - Name bot - Locator NA
 Nb of data          =        189
 Nb of active values =        189
 Minimum value       =  -1067.370
 Maximum value       =  -1036.050
 Mean value          =  -1050.542
 Standard Deviation  =      6.903
 Variance            =     47.646
6 - Name appraisal - Locator NA
 Nb of data          =        189
 Nb of active values =        189
 Minimum value       =      0.000
 Maximum value       =      1.000
 Mean value          =      0.265
 Standard Deviation  =      0.441
 Variance            =      0.195

Variables
---------
Column = 0 - Name = rank - Locator = NA
Column = 1 - Name = X - Locator = x1
Column = 2 - Name = Y - Locator = x2
Column = 3 - Name = top - Locator = NA
Column = 4 - Name = bot - Locator = NA
Column = 5 - Name = appraisal - Locator = NA


# Map of the wells, colored by the "appraisal" variable.
fig, ax = gp.initGeographic()
ax.symbol(mydb, nameColor="appraisal")
ax.decoration(title="Geometry Information")
plt.show()


# Thickness is derived as top minus bottom and stored as a new variable,
# then its distribution is shown as a 30-bin histogram.
mydb["thick"] = mydb["top"] - mydb["bot"]
fig, ax = gp.init()
ax.histogram(mydb, name="thick", bins=30)
plt.show()


# Regular 2-D grid: 101 x 151 nodes, mesh 100 x 100, origin at (50, 50).
mygrid = gl.DbGrid.create(nx=[101, 151], dx=[100, 100], x0=[50, 50])
mygrid

Data Base Grid Characteristics
==============================

Data Base Summary
-----------------
File is organized as a regular grid
Space dimension              = 2
Number of Columns            = 3
Total number of samples      = 15251

Grid characteristics:
---------------------
Origin :     50.000    50.000
Mesh   :    100.000   100.000
Number :        101       151

Variables
---------
Column = 0 - Name = rank - Locator = NA
Column = 1 - Name = x1 - Locator = x1
Column = 2 - Name = x2 - Locator = x2


# Draw the grid cells (step=5) with the wells plotted on top.
fig, ax = gp.initGeographic()
ax.cell(mygrid, color='black', step=5)
ax.symbol(mydb)
plt.show()


# Make "top" the variable of interest (Z locator) and compute its
# experimental variogram with ndir=4, npas=15, dpas=500
# (presumably 4 directions, 15 lags of size 500 -- confirm in gstlearn docs).
mydb.setLocator("top", gl.ELoc.Z)
varioparam = gl.VarioParam.createMultiple(ndir=4, npas=15, dpas=500)
vario_top = gl.Vario.computeFromDb(varioparam, mydb)


# idir=-1: presumably "plot every direction" -- confirm in gstlearn docs.
fig, ax = gp.init()
ax.variogram(vario_top, idir=-1, flagLegend=True)
plt.show()


# Variogram map of the current Z variable, computed with [20, 20].
vmap_top = gl.db_vmap_compute(mydb, gl.ECalcVario.VARIOGRAM, [20, 20])

fig, ax = gp.initGeographic()
ax.raster(vmap_top, "*Var")
ax.decoration(title="Variogram Map for Top")
plt.show()


# Fit a model to the experimental variogram, using the default structures.
model_top = gl.Model()
err = model_top.fit(vario_top)
model_top

Model characteristics
=====================
Space dimension              = 2
Number of variable(s)        = 1
Number of basic structure(s) = 1
Number of drift function(s)  = 0
Number of drift equation(s)  = 0

Covariance Part
---------------
Spherical
- Sill         =    157.461
- Ranges       =  24037.055  5003.649
- Angles       =     21.202     0.000
- Rotation Matrix
               [,  0]    [,  1]
     [  0,]     0.932    -0.362
     [  1,]     0.362     0.932
Total Sill     =    157.461


# Experimental variogram of "top" together with its fitted model.
fig, ax = gp.init()
ax = gp.varmod(vario_top, model_top)
plt.show()


# Same workflow for "bot": it becomes the Z variable, then the experimental
# variogram is computed with the same parameters as for "top".
mydb.setLocator("bot", gl.ELoc.Z)
varioparam = gl.VarioParam.createMultiple(ndir=4, npas=15, dpas=500)
vario_bot = gl.Vario.computeFromDb(varioparam, mydb)

fig, ax = gp.init()
ax.variogram(vario_bot, idir=-1, flagLegend=True)
plt.show()


# Variogram map of the current Z variable ("bot").
vmap_bot = gl.db_vmap_compute(mydb, gl.ECalcVario.VARIOGRAM, [20, 20])

fig, ax = gp.initGeographic()
ax.raster(vmap_bot, "*Var")
ax.decoration(title="Variogram Map for Bottom")
plt.show()


# Fit a model restricted to spherical and exponential structures.
types = gl.ECov.fromKeys(["SPHERICAL", "EXPONENTIAL"])
model_bot = gl.Model()
err = model_bot.fit(vario_bot, types)
model_bot

Model characteristics
=====================
Space dimension              = 2
Number of variable(s)        = 1
Number of basic structure(s) = 2
Number of drift function(s)  = 0
Number of drift equation(s)  = 0

Covariance Part
---------------
Spherical
- Sill         =     11.914
- Ranges       =   2811.249   986.432
- Angles       =     25.340     0.000
- Rotation Matrix
               [,  0]    [,  1]
     [  0,]     0.904    -0.428
     [  1,]     0.428     0.904
Exponential
- Sill         =    103.277
- Ranges       =  95677.717 24735.006
- Theo. Ranges =  31938.010  8256.749
- Angles       =    353.264     0.000
- Rotation Matrix
               [,  0]    [,  1]
     [  0,]     0.993     0.117
     [  1,]    -0.117     0.993
Total Sill     =    115.190


# Experimental variogram of "bot" together with its fitted model.
fig, ax = gp.init()
ax = gp.varmod(vario_bot, model_bot)
plt.show()


# Same workflow for "thick": it becomes the Z variable, then the
# experimental variogram is computed with the same parameters as before.
mydb.setLocator("thick", gl.ELoc.Z)
varioparam = gl.VarioParam.createMultiple(ndir=4, npas=15, dpas=500)
vario_thick = gl.Vario.computeFromDb(varioparam, mydb)

fig, ax = gp.init()
ax.variogram(vario_thick, idir=-1, flagLegend=True)
plt.show()


# Variogram map of the current Z variable ("thick").
vmap_thick = gl.db_vmap_compute(mydb, gl.ECalcVario.VARIOGRAM, [20, 20])

fig, ax = gp.initGeographic()
ax.raster(vmap_thick, "*Var")
ax.decoration(title="Variogram Map for Thickness")
plt.show()


# Fit a model restricted to a single spherical structure.
types = gl.ECov.fromKeys(["SPHERICAL"])
model_thick = gl.Model()
err = model_thick.fit(vario_thick, types)
model_thick

Model characteristics
=====================
Space dimension              = 2
Number of variable(s)        = 1
Number of basic structure(s) = 1
Number of drift function(s)  = 0
Number of drift equation(s)  = 0

Covariance Part
---------------
Spherical
- Sill         =    124.911
- Ranges       =   9102.815  4618.492
- Angles       =     23.011     0.000
- Rotation Matrix
               [,  0]    [,  1]
     [  0,]     0.920    -0.391
     [  1,]     0.391     0.920
Total Sill     =    124.911


# Experimental variogram of "thick" together with its fitted model.
fig, ax = gp.init()
ax = gp.varmod(vario_thick, model_thick)
plt.show()


# Cubic covariance model with range 2000; it is handed to the estimator
# below alongside flag_std=True.
model = gl.Model.createFromParam(type=gl.ECov.CUBIC, range=2000)


# Nearest-neighbor estimation of the current Z variable onto the grid.
err = gl.nearestNeighbor(mydb, mygrid, flag_std=True, model=model)


# One map per result variable, with the wells overlaid in black.
for map_name, map_title in (
    ("Nearest.thick.estim", "Nearest Neighbor"),
    ("Nearest.thick.stdev", "Nearest Neighbor (stdev)"),
):
    fig, ax = gp.initGeographic()
    ax.raster(mygrid, name=map_name, flagLegend=True)
    ax.symbol(mydb, c='black')
    ax.decoration(title=map_title)
    plt.show()


# Moving average with a small neighborhood (radius 5000, nmaxi=5).
# Results use the default names "MovAve.thick.*" plotted below.
neigh_small = gl.NeighMoving.create(radius=5000, nmaxi=5)
err = gl.movingAverage(mydb, mygrid, neigh_small, flag_std=True, model=model)


for map_name, map_title in (
    ("MovAve.thick.estim", "Moving Average (Small Neighborhood)"),
    ("MovAve.thick.stdev", "Moving Average (Small Neighborhood) (stdev)"),
):
    fig, ax = gp.initGeographic()
    ax.raster(mygrid, name=map_name, flagLegend=True)
    ax.symbol(mydb, c='black')
    ax.decoration(title=map_title)
    plt.show()


# Same estimator with a larger neighborhood (radius 5000, nmaxi=20).
# A dedicated naming convention keeps these results apart from the
# small-neighborhood ones.
neigh_large = gl.NeighMoving.create(radius=5000, nmaxi=20)
err = gl.movingAverage(
    mydb, mygrid, neigh_large, flag_std=True, model=model,
    namconv=gl.NamingConvention("MovAve_Large"),
)


for map_name, map_title in (
    ("MovAve_Large.thick.estim", "Moving Average (Large Neighborhood)"),
    ("MovAve_Large.thick.stdev", "Moving Average (Large Neighborhood) (stdev)"),
):
    fig, ax = gp.initGeographic()
    ax.raster(mygrid, name=map_name, flagLegend=True)
    ax.symbol(mydb, c='black')
    ax.decoration(title=map_title)
    plt.show()


# Inverse distance estimation with dmax=2000; results are stored on the grid
# under the "InvDist.thick.*" names plotted below.
err = gl.inverseDistance(mydb, mygrid, dmax=2000, flag_std=True, model=model)


for map_name, map_title in (
    ("InvDist.thick.estim", "Inverse (squared) distance"),
    ("InvDist.thick.stdev", "Inverse (squared) distance (stdev)"),
):
    fig, ax = gp.initGeographic()
    ax.raster(mygrid, name=map_name, flagLegend=True)
    ax.symbol(mydb, c='black')
    ax.decoration(title=map_title)
    plt.show()


# Moving median with the small neighborhood; results are stored on the grid
# under the default "MovMed.thick.*" names plotted below.
err = gl.movingMedian(mydb, mygrid, neigh_small, flag_std=True, model=model)


for map_name, map_title in (
    ("MovMed.thick.estim", "Moving Median (Small Neighborhood)"),
    ("MovMed.thick.stdev", "Moving Median (Small Neighborhood) (stdev)"),
):
    fig, ax = gp.initGeographic()
    ax.raster(mygrid, name=map_name, flagLegend=True)
    ax.symbol(mydb, c='black')
    ax.decoration(title=map_title)
    plt.show()


# Moving median with the large neighborhood.
# The estimator has to be movingMedian: calling movingAverage here would
# store a moving *average* under the "MovMed_Large" prefix.
err = gl.movingMedian(mydb, mygrid, neigh_large, flag_std=True, model=model,
                      namconv=gl.NamingConvention("MovMed_Large"))


# Plot the large-neighborhood results ("MovMed_Large.*"), not the
# small-neighborhood ones stored under the default "MovMed.*" prefix.
fig, ax = gp.initGeographic()
ax.raster(mygrid, name="MovMed_Large.thick.estim", flagLegend=True)
ax.symbol(mydb, c='black')
ax.decoration(title="Moving Median (Large Neighborhood)")
plt.show()


fig, ax = gp.initGeographic()
ax.raster(mygrid, name="MovMed_Large.thick.stdev", flagLegend=True)
ax.symbol(mydb, c='black')
ax.decoration(title="Moving Median (Large Neighborhood) (stdev)")
plt.show()


# 3-D surface view of the large-neighborhood median estimate; the vertical
# axis is flattened (z aspect ratio 0.2) relative to x and y.
surface = gop.SurfaceOnDbGrid(mygrid, "MovMed_Large.thick.estim", showscale=False)
fig = go.Figure(data=[surface])
fig.update_layout(autosize=True,
                  scene_aspectmode='manual', scene_aspectratio=dict(x=1, y=1, z=0.2))
f = fig.show()


# Moving neighborhood limited to radius 2000 and nmaxi=8.
neigh_moving = gl.NeighMoving.create(radius=2000, nmaxi=8)

# Run the kriging test at a single grid node and keep the result so that
# the neighborhood and the weights can be drawn.
node = 8030
res = gl.krigtest(mydb, mygrid, model_thick, neigh_moving, iech0=node, verbose=False)


fig, ax = gp.initGeographic()
ax.symbol(mydb, c='black')
ax.neigh(neigh_moving, mygrid, node, flagZoom=True)
ax.neighWeights(res)
plt.show()


# Same test with a sector-based neighborhood (nsect=6, nsmax=2).
neigh_moving = gl.NeighMoving.create(radius=2000, nsect=6, nsmax=2)

res = gl.krigtest(mydb, mygrid, model_thick, neigh_moving, iech0=node, verbose=False)
fig, ax = gp.initGeographic()
ax.symbol(mydb, c='black')
ax.neigh(neigh_moving, mygrid, node, flagZoom=True)
ax.neighWeights(res)
plt.show()


# Thickness variogram and model again, this time with showPairs=True.
fig, ax = gp.init()
ax = gp.varmod(vario_thick, model_thick, showPairs=True)
plt.show()


# Alternative thickness model: nugget effect plus spherical structure.
types = gl.ECov.fromKeys(["NUGGET", "SPHERICAL"])
model_thick2 = gl.Model()
err = model_thick2.fit(vario_thick, types)

fig, ax = gp.init()
ax = gp.varmod(vario_thick, model_thick2, showPairs=True)
plt.show()


# Kriging test at the same node with the alternative model.
res = gl.krigtest(mydb, mygrid, model_thick2, neigh_moving, iech0=node, verbose=False)
fig, ax = gp.initGeographic()
ax.symbol(mydb, c='black')
ax.neigh(neigh_moving, mygrid, node, flagZoom=True)
ax.neighWeights(res)
plt.show()


# Cross-validation on the data base. flag_xvalid_est=-1 presumably stores the
# estimate itself rather than the estimation error -- confirm in gstlearn
# docs; the plots below read "Xvalid.*.estim" and "Xvalid.*.stderr".
err = gl.xvalid(mydb, model_thick, neigh_moving, flag_xvalid_est=-1)


fig, axs = plt.subplots(2, 2, figsize=(10, 10))
ax_map, ax_hist = axs[0, 0], axs[0, 1]
ax_err, ax_true = axs[1, 0], axs[1, 1]

# Top-left: wells sized by the absolute standardized error.
ax_map.symbol(mydb, nameSize="Xvalid.*.stderr", flagAbsSize=True)
ax_map.decoration(title="Standardized Errors (absolute value)")
ax_map.set_aspect(1)

# Top-right: histogram of standardized errors with +/-2.5 guide lines.
ax_hist.histogram(mydb, name="Xvalid.*.stderr", bins=20)
for bound in (-2.5, 2.5):
    ax_hist.axvline(bound, color='black', linestyle='dashed')
ax_hist.decoration(title="Histogram of Standardized Errors")

# Bottom-left: standardized error against the estimate.
ax_err.correlation(mydb, namey="Xvalid.*.stderr", namex="Xvalid.*.estim",
                   asPoint=True)
ax_err.decoration(xlabel="Estimation", ylabel="Standardized Error")
ax_err.axhline(-2.5, color='black', linestyle='dashed')
ax_err.axhline(0, color='black', linestyle='solid')
ax_err.axhline(2.5, color='black', linestyle='dashed')

# Bottom-right: true thickness against the estimate, with the diagonal.
ax_true.correlation(mydb, namey="thick", namex="Xvalid.*.estim",
                    asPoint=True, diagLine=True, flagSameAxes=True)
ax_true.decoration(xlabel="Estimation", ylabel="True Value")
plt.show()


# Set "thick" as the Z variable again before kriging, and widen the
# neighborhood (radius 5000, nsect=6, nsmax=5).
mydb.setLocator("thick", gl.ELoc.Z)
neigh_moving = gl.NeighMoving.create(radius=5000, nsect=6, nsmax=5)

err = gl.kriging(mydb, mygrid, model_thick, neigh_moving)


# Estimation map, then standard-deviation map, with the wells in black.
for map_name, map_title in (
    ("Kriging.thick.estim", "Thickness: Estimation"),
    ("Kriging.thick.stdev", "Thickness: Standard deviation of Estimation error"),
):
    fig, ax = gp.initGeographic()
    ax.raster(mygrid, name=map_name, flagLegend=True)
    ax.symbol(mydb, c='black')
    ax.decoration(title=map_title)
    plt.show()


# Declare "top" and "thick" jointly as Z variables and compute the
# experimental variograms, reusing the existing varioparam.
mydb.setLocators(["top", "thick"], gl.ELoc.Z)
vario_multi = gl.Vario.computeFromDb(varioparam, mydb)

# Fit a model built from an exponential and a spherical structure.
types = gl.ECov.fromKeys(["EXPONENTIAL", "SPHERICAL"])
model_multi = gl.Model()
err = model_multi.fit(vario_multi, types)


# Notebook display of the fitted model.
model_multi

Model characteristics
=====================
Space dimension              = 2
Number of variable(s)        = 2
Number of basic structure(s) = 2
Number of drift function(s)  = 0
Number of drift equation(s)  = 0

Covariance Part
---------------
Exponential
- Sill matrix:
               [,  0]    [,  1]
     [  0,]     4.561    17.075
     [  1,]    17.075    63.923
- Ranges       =   6933.278  6452.664
- Theo. Ranges =   2314.385  2153.952
- Angles       =     23.709     0.000
- Rotation Matrix
               [,  0]    [,  1]
     [  0,]     0.916    -0.402
     [  1,]     0.402     0.916
Spherical
- Sill matrix:
               [,  0]    [,  1]
     [  0,]   151.897   100.451
     [  1,]   100.451    69.070
- Ranges       =  23190.112  4994.942
- Angles       =     22.305     0.000
- Rotation Matrix
               [,  0]    [,  1]
     [  0,]     0.925    -0.380
     [  1,]     0.380     0.925
Total Sill
               [,  0]    [,  1]
     [  0,]   156.458   117.526
     [  1,]   117.526   132.992


# Experimental variograms and fitted model on a 2 x 2 figure.
fig, axs = gp.init(2, 2)
fig.varmod(vario_multi, model_multi)
plt.show()


# Joint estimation with the bivariate model; results are prefixed
# "CoKriging" on the grid.
err = gl.kriging(
    mydb, mygrid, model_multi, neigh_moving,
    namconv=gl.NamingConvention("CoKriging"),
)


fig, ax = gp.initGeographic()
ax.raster(mygrid, name="CoKriging.thick.estim", flagLegend=True)
ax.symbol(mydb, c='black')
ax.decoration(title="Thickness: Estimation (CoKriging)")
plt.show()


# Bottom surface deduced from the two estimates: bot = top - thick.
mygrid["CoKriging.bot.estim"] = (
    mygrid["CoKriging.top.estim"] - mygrid["CoKriging.thick.estim"]
)


# 3-D view of the estimated top and bottom surfaces together.
surf_top = gop.SurfaceOnDbGrid(mygrid, "CoKriging.top.estim")
surf_bot = gop.SurfaceOnDbGrid(mygrid, "CoKriging.bot.estim")
fig = go.Figure(data=[surf_top, surf_bot])
f = fig.show()

Study of a Reservoir

Import packages

Reading data

Estimation

Structural analysis of the variables

Analysis of the top variable

Analysis of the bottom variable

Analysis of the thickness variable

Traditional Estimation methods

The nearest neighbor method

The moving average method

The inverse (squared) distance

The moving median

Kriging Method

Neighborhood search

Kriging Weights

Cross-Validation

Estimation map

Standard deviation map

Processing the information jointly

Multivariate structural analysis

Joint estimation