Steel model definition, with Dirichlet priors.

In [1]:

from steel_processes import define_processes
processes = define_processes()

/home/rick/anaconda3/envs/bayesian-mfa-paper/lib/python3.6/site-packages/matplotlib/__init__.py:913: UserWarning: axes.color_cycle is deprecated and replaced with axes.prop_cycle; please use the latter.
  warnings.warn(self.msg_depr % (key, alt_key))

In [2]:

import theano
theano.config.mode = 'FAST_RUN'
theano.config.optimizer = 'fast_compile'

Maximum values of inputs:

In [3]:

input_defs = {
    'BF': 5000,
    'DR': 300,
    'SP': 1000,
    'IFC': 300,
}

In [4]:

import pickle
from priors import param_defs
from leontief_model import SplitParamModel

In [5]:

model1 = SplitParamModel(processes, input_defs, param_defs)

In [6]:

with open('model1.pickle', 'wb') as f:
    pickle.dump(model1, f, protocol=pickle.HIGHEST_PROTOCOL)

In [7]:

import pymc3 as pm
RANDOM_SEED = 974067  # from random.org

In [ ]:

with model1.model:
    advi1 = pm.variational.advi(n=10000, random_seed=RANDOM_SEED)
np.savez('results/advi1.npz', advi1)

In [13]:

plt.plot(advi1.elbo_vals[0:]);

In [22]:

def sample(model, advi, trace=None, num_samples=2000):
    step = pm.NUTS(scaling=model.dict_to_array(advi.stds)**2, is_cov=True)
    trace = pm.sample(num_samples, start=advi.means, step=step, trace=trace)
    return trace

In [ ]:

with model1.model:
    trace1 = sample(model1.model, advi1, trace=pm.backends.Text('case_study_global_steel/trace1'))

In [25]:

pm.traceplot(trace1, varnames=['inputs', 'param_OBF', 'param_OBFS']);

Add observations¶

In [8]:

observations1 = [
        (['BF'], ['PI'], 928.4, 50),  # worldsteel: Table 41 - total pig iron
        (['DR'], ['DRI'], 65.8, 6),   # worldsteel: Table 42 - total DRI
        
        (['EAF'], ['EAFS'], 407.0, 40),  # worldsteel: Table 6 - EAF crude steel production
        (['OBF'], ['OBFS'], 891.7, 80),  # worldsteel: Table 6 - OBC crude steel production
        (['OHF'], ['OHFS'], 29.3, 3),    # worldsteel: Table 6 - OHF + other crude steel production
        
        # SEM output, from worldsteel
        (['SEMP'], ['seclight'], 44.4, 2),    # Cullen flow [105]: worldsteel table 16
        (['SEMP'], ['secheavy'], 39.6, 2),    # Cullen flow [106]: worldsteel table 15
        (['SEMP'], ['secrail'], 10.0, 1),     # Cullen flow [107]: worldsteel table 14
        
        # RBM output, from worldsteel
        (['STP'], ['seamlesstube'], 27.2, 2), # Cullen flow [85]: worldsteel table 25
        (['RBMP'], ['rodrebar'], 147.0, 15),  # Cullen flow [108]: worldsteel table 17 (he added extra 26.6 to make it add up)
        (['RBMP'], ['rodwire'], 148.5, 15),   # Cullen flow [109]: worldsteel table 19
        (['RBMP'], ['rodbar'], 109.7, 11),    # Cullen flow [110]: worldsteel table 18
        
        # PLM output, from worldsteel & others
        (['TWP'], ['weldedtube'], 44.5, 4),   # Cullen flow [89]: worldsteel table 26. (he solved as 62.4 to make "apparent consumption" match)
        (['PLMP'], ['plate'], 110.0, 11),     # Cullen flow [111]: SBB value (ref 14, p4)
        
        # HSM output, from worldsteel & SBB
        (['CRMP'], ['elsheet'], 10.3, 2),      # Cullen flow [112]: worldsteel table 20
        (['CRMP'], ['crc'], 135.0, 13),        # Cullen flow [113]: SBB (ref 14, p4)
        (['GPP_CR'], ['crcgalv'], 96.4, 9),    # Cullen flow [114]: worldsteel table 22 (assumed all CRC)
        (['HSMP'], ['hrc'], 150.0, 15),        # Cullen flow [115]: SBB (ref 14, p4)
        (['HSMP'], ['hrns'], 40.0, 4),         # Cullen flow [116]: SBB (ref 14, p4)
        (['GP_HR'], ['hrcgalv'], 10.0, 2),     # Cullen flow [97]: SBB (ref 14, p4)
        (['TM'], ['crctinned'], 11.6, 2),      # Cullen flow [100]: worldsteel table 21 (all tinmill)
        (['OCP'], ['crccoated'], 16.5, 2),     # Cullen flow [103]: worldsteel table 23 (all non-metalic coated)
]

In [9]:

model2 = SplitParamModel(processes, input_defs, param_defs, flow_observations=observations1)

In [10]:

with open('model2.pickle', 'wb') as f:
    pickle.dump(model2, f, protocol=pickle.HIGHEST_PROTOCOL)

In [44]:

with model2.model:
    advi2 = pm.variational.advi(n=10000)
np.savez('case_study_global_steel/advi2.npz', advi2)    

Iteration 0 [0%]: ELBO = -9943.01
Iteration 1000 [10%]: Average ELBO = -38691.52
Iteration 2000 [20%]: Average ELBO = -17266.05
Iteration 3000 [30%]: Average ELBO = -8393.54
Iteration 4000 [40%]: Average ELBO = -4263.99
Iteration 5000 [50%]: Average ELBO = -2281.89
Iteration 6000 [60%]: Average ELBO = -1223.61
Iteration 7000 [70%]: Average ELBO = -903.54
Iteration 8000 [80%]: Average ELBO = -670.74
Iteration 9000 [90%]: Average ELBO = -566.42
Finished [100%]: Average ELBO = -481.78

In [45]:

plt.plot(advi2.elbo_vals[0:]);

In [48]:

with model2.model:
    trace2 = sample(model2.model, advi2, trace=pm.backends.Text('case_study_global_steel/trace2'), num_samples=500)

  0%|          | 0/500 [00:00<?, ?it/s]
  0%|          | 1/500 [00:00<05:34,  1.49it/s]
  1%|          | 3/500 [00:01<04:31,  1.83it/s]
Exception in thread Thread-4:
Traceback (most recent call last):
  File "/home/rick/anaconda3/envs/theano/lib/python3.5/threading.py", line 914, in _bootstrap_inner
    self.run()
  File "/home/rick/anaconda3/envs/theano/lib/python3.5/site-packages/tqdm/_tqdm.py", line 102, in run
    for instance in self.tqdm_cls._instances:
  File "/home/rick/anaconda3/envs/theano/lib/python3.5/_weakrefset.py", line 60, in __iter__
    for itemref in self.data:
RuntimeError: Set changed size during iteration

100%|██████████| 500/500 [31:49<00:00,  4.55s/it]

In [49]:

pm.traceplot(trace2, varnames=['inputs', 'param_OBF', 'param_OBFS', 'Fobs']);

Next data points to add:

Cullen flow [57]: cast iron product. 54 - scrap. 55 - pig iron. 56 - other scrap. 59 - loop
scrap steel input [53] should be 17% of inputs, from considering the dilution. need another observation type?
pig iron to casting is [5] - [12] - [16] - [20], ie. [bf output] - [EAF, OBF, OHF use]
pig iron to EAF is observed [12]
pig iron to OBF [16] comes from yield and scrap input. Scrap is what's left from [10]-[13]-[54].
pig iron to OHF [20] is well defined since there's no scrap input
scrap to OBF is [scrap prepared]-[scrap to EAF: observed]-[scrap to casting: from concentrations]
scrap prepared [10] is given by forming scrap [8] and observed other input. Until I include fabrication scrap, this needs to be an input observation?

Summary:

add pig iron to EAF observation [12]
add scrap input observation [10]
add cast iron production [57]
add cast iron scrap input fraction = 17%
add steel casting production [51]

In [11]:

observations2 = observations1 + [
    (['PI'], ['EAF'], 44.6, 4),   # Cullen flow [12] (ref 2)
    (['SPC'], ['caststeel'], 10.5, 2),    # Cullen flow [51], from ref (11)
    (['IFC'], ['castiron'], 68.3, 6),     # Cullen flow [57], from ref (11)
]

input_observations = [
    (['SP'], 475.5, 40),     # Cullen flow [10]; change if fabrication scrap is added
]

inflow_fraction_observations = [
    (['S'], ['IFC'], 0.17, 0.03),         # Cullen flow [54] -- scrap is 17%.
    # Should be relative to cast iron output, not process throughput.
]

In [12]:

model3 = SplitParamModel(processes, input_defs, param_defs,
                         flow_observations=observations2,
                         input_observations=input_observations,
                         inflow_observations=inflow_fraction_observations)

In [13]:

with open('model3.pickle', 'wb') as f:
    pickle.dump(model3, f, protocol=pickle.HIGHEST_PROTOCOL)

In [64]:

with model3.model:
    advi3 = pm.variational.advi(n=10000)
np.savez('case_study_global_steel/advi3.npz', advi3)

Iteration 0 [0%]: ELBO = -34424.14
Iteration 1000 [10%]: Average ELBO = -85841.01
Iteration 2000 [20%]: Average ELBO = -45837.1
Iteration 3000 [30%]: Average ELBO = -20539.96
Iteration 4000 [40%]: Average ELBO = -9743.25
Iteration 5000 [50%]: Average ELBO = -5146.05
Iteration 6000 [60%]: Average ELBO = -2764.31
Iteration 7000 [70%]: Average ELBO = -1708.03
Iteration 8000 [80%]: Average ELBO = -1210.84
Iteration 9000 [90%]: Average ELBO = -885.6
Finished [100%]: Average ELBO = -678.17

In [67]:

plt.plot(advi3.elbo_vals[0:]);

In [68]:

with model3.model:
    trace3 = sample(model3.model, advi3, trace=pm.backends.Text('case_study_global_steel/trace3'), num_samples=500)

100%|██████████| 500/500 [32:26<00:00,  2.20s/it]

In [ ]:

pm.traceplot(trace3, varnames=['inputs', 'param_OBF', 'param_OBFS', 'Fobs']);