% Sutton, Mahmood, and White (2016): journal article in JMLR, volume 17, number 73.
% Author names are stored in the unambiguous "Last, First" form.
@article{JMLR:v17:14-488,
  author  = {Sutton, Richard S. and Mahmood, A. Rupam and White, Martha},
  title   = {An Emphatic Approach to the Problem of Off-policy Temporal-Difference Learning},
  journal = {Journal of Machine Learning Research},
  year    = {2016},
  volume  = {17},
  number  = {73},
  pages   = {1--29},
  url     = {http://jmlr.org/papers/v17/14-488.html},
}