A gradient-based reinforcement learning approach to dynamic pricing in partially-observable environments

David Vengerov. A gradient-based reinforcement learning approach to dynamic pricing in partially-observable environments. Future Generation Computer Systems, 24(7):687-693, 2008. doi:10.1016/j.future.2008.02.012

@comment{Journal article record. The fields tags, researchr, cites and citedby
are not standard BibTeX fields; standard styles ignore them, so they act as
annotations only. The researchr link suggests the record came from
researchr.org -- TODO confirm.}
@article{Vengerov08:0,
  author    = {Vengerov, David},
  title     = {A gradient-based reinforcement learning approach to dynamic pricing in partially-observable environments},
  journal   = {Future Generation Computer Systems},
  volume    = {24},
  number    = {7},
  pages     = {687--693},
  year      = {2008},
  doi       = {10.1016/j.future.2008.02.012},
  url       = {http://dx.doi.org/10.1016/j.future.2008.02.012},
  tags      = {rule-based, Meta-Environment, systematic-approach},
  researchr = {https://researchr.org/publication/Vengerov08%3A0},
  cites     = {0},
  citedby   = {0},
}