BibTeX record journals/corr/abs-2404-11049

download as .bib file

% arXiv preprint (CoRR) record taken from the dblp computer science bibliography.
% The url, biburl and bibsource fields point directly at doi.org / dblp.org.
@article{DBLP:journals/corr/abs-2404-11049,
  author       = {Akifumi Wachi and
                  Thien Q. Tran and
                  Rei Sato and
                  Takumi Tanabe and
                  Yohei Akimoto},
  title        = {Stepwise Alignment for Constrained Language Model Policy Optimization},
  journal      = {CoRR},
  volume       = {abs/2404.11049},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2404.11049},
  doi          = {10.48550/ARXIV.2404.11049},
  eprinttype   = {arXiv},
  eprint       = {2404.11049},
  timestamp    = {Wed, 22 May 2024 08:50:15 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2404-11049.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}