Skip to content

Commit 1987c85

Browse files
idavisorpuente-MS
andauthored
Add ability to parse quantum decls and lit exprs (#2160)
Co-authored-by: Oscar Puente <[email protected]>
1 parent 2319775 commit 1987c85

File tree

11 files changed

+1417
-140
lines changed

11 files changed

+1417
-140
lines changed

compiler/qsc_qasm3/src/ast.rs

+25-22
Original file line numberDiff line numberDiff line change
@@ -5,6 +5,7 @@
55
#![allow(dead_code)]
66

77
use indenter::{indented, Indented};
8+
use num_bigint::BigInt;
89
use qsc_data_structures::span::{Span, WithSpan};
910
use std::{
1011
fmt::{self, Display, Formatter, Write},
@@ -1037,7 +1038,7 @@ impl Display for IncludeStmt {
10371038
#[derive(Clone, Debug)]
10381039
pub struct QubitDeclaration {
10391040
pub span: Span,
1040-
pub qubit: Identifier,
1041+
pub qubit: Ident,
10411042
pub size: Option<ExprStmt>,
10421043
}
10431044

@@ -1571,7 +1572,7 @@ pub enum ExprKind {
15711572
Ident(Ident),
15721573
UnaryExpr(UnaryExpr),
15731574
BinaryExpr(BinaryExpr),
1574-
Literal(Lit),
1575+
Lit(Lit),
15751576
FunctionCall(FunctionCall),
15761577
Cast(Cast),
15771578
Concatenation(Concatenation),
@@ -1583,14 +1584,14 @@ impl Display for ExprKind {
15831584
let indent = set_indentation(indented(f), 0);
15841585
match self {
15851586
ExprKind::Err => write!(f, "Err"),
1586-
ExprKind::Ident(id) => write!(f, "Ident {id}"),
1587-
ExprKind::UnaryExpr(expr) => write!(f, "UnaryExpr {expr}"),
1587+
ExprKind::Ident(id) => write!(f, "{id}"),
1588+
ExprKind::UnaryExpr(expr) => write!(f, "{expr}"),
15881589
ExprKind::BinaryExpr(expr) => display_bin_op(indent, expr),
1589-
ExprKind::Literal(lit) => write!(f, "Literal {lit}"),
1590-
ExprKind::FunctionCall(call) => write!(f, "FunctionCall {call}"),
1591-
ExprKind::Cast(cast) => write!(f, "Cast {cast}"),
1592-
ExprKind::Concatenation(concat) => write!(f, "Concatenation {concat}"),
1593-
ExprKind::IndexExpr(index) => write!(f, "IndexExpr {index}"),
1590+
ExprKind::Lit(lit) => write!(f, "{lit}"),
1591+
ExprKind::FunctionCall(call) => write!(f, "{call}"),
1592+
ExprKind::Cast(cast) => write!(f, "{cast}"),
1593+
ExprKind::Concatenation(concat) => write!(f, "{concat}"),
1594+
ExprKind::IndexExpr(index) => write!(f, "{index}"),
15941595
}
15951596
}
15961597
}
@@ -1740,19 +1741,20 @@ pub struct Lit {
17401741

17411742
impl Display for Lit {
17421743
fn fmt(&self, f: &mut Formatter<'_>) -> fmt::Result {
1743-
write!(f, "Lit {}: {}", self.span, self.kind)
1744+
write!(f, "Lit: {}", self.kind)
17441745
}
17451746
}
17461747

17471748
#[derive(Clone, Debug)]
17481749
pub enum LiteralKind {
17491750
Array(List<ExprStmt>),
1750-
Bitstring { value: usize, width: u32 },
1751-
Boolean(bool),
1751+
Bitstring(BigInt, usize),
1752+
Bool(bool),
17521753
Duration { value: f64, unit: TimeUnit },
17531754
Float(f64),
17541755
Imaginary(f64),
1755-
Integer(i64),
1756+
Int(i64),
1757+
BigInt(BigInt),
17561758
String(Rc<str>),
17571759
}
17581760

@@ -1764,21 +1766,22 @@ impl Display for LiteralKind {
17641766
write!(indent, "Array:")?;
17651767
indent = set_indentation(indent, 1);
17661768
for expr in exprs {
1767-
write!(indent, "\n{expr}")?;
1769+
write!(indent, "\n{expr:?}")?;
17681770
}
17691771
Ok(())
17701772
}
1771-
LiteralKind::Bitstring { value, width } => {
1772-
write!(f, "Bitstring: {value} (width {width})")
1773+
LiteralKind::Bitstring(value, width) => {
1774+
write!(f, "Bitstring(\"{:0>width$}\")", value.to_str_radix(2))
17731775
}
1774-
LiteralKind::Boolean(b) => write!(f, "Boolean: {b}"),
1776+
LiteralKind::Bool(b) => write!(f, "Bool({b:?})"),
17751777
LiteralKind::Duration { value, unit } => {
1776-
write!(f, "Duration: {value} {unit}")
1778+
write!(f, "Duration({value:?}, {unit:?})")
17771779
}
1778-
LiteralKind::Float(value) => write!(f, "Float: {value}"),
1779-
LiteralKind::Imaginary(value) => write!(f, "Imaginary: {value} im"),
1780-
LiteralKind::Integer(i) => write!(f, "Integer: {i}"),
1781-
LiteralKind::String(s) => write!(f, "String: {s}"),
1780+
LiteralKind::Float(value) => write!(f, "Float({value:?})"),
1781+
LiteralKind::Imaginary(value) => write!(f, "Imaginary({value:?})"),
1782+
LiteralKind::Int(i) => write!(f, "Int({i:?})"),
1783+
LiteralKind::BigInt(i) => write!(f, "BigInt({i:?})"),
1784+
LiteralKind::String(s) => write!(f, "String({s:?})"),
17821785
}
17831786
}
17841787
}

compiler/qsc_qasm3/src/lex/cooked.rs

+61-7
Original file line numberDiff line numberDiff line change
@@ -49,6 +49,10 @@ pub enum Error {
4949
#[diagnostic(code("Qasm3.Lex.UnterminatedString"))]
5050
UnterminatedString(#[label] Span),
5151

52+
#[error("string literal with an invalid escape sequence")]
53+
#[diagnostic(code("Qasm3.Lex.InvalidEscapeSequence"))]
54+
InvalidEscapeSequence(#[label] Span),
55+
5256
#[error("unrecognized character `{0}`")]
5357
#[diagnostic(code("Qasm3.Lex.UnknownChar"))]
5458
Unknown(char, #[label] Span),
@@ -64,6 +68,7 @@ impl Error {
6468
Self::IncompleteEof(expected, token, span + offset)
6569
}
6670
Self::UnterminatedString(span) => Self::UnterminatedString(span + offset),
71+
Self::InvalidEscapeSequence(span) => Self::InvalidEscapeSequence(span + offset),
6772
Self::Unknown(c, span) => Self::Unknown(c, span + offset),
6873
}
6974
}
@@ -73,6 +78,7 @@ impl Error {
7378
Error::Incomplete(_, _, _, s)
7479
| Error::IncompleteEof(_, _, s)
7580
| Error::UnterminatedString(s)
81+
| Error::InvalidEscapeSequence(s)
7682
| Error::Unknown(_, s) => s,
7783
}
7884
}
@@ -82,6 +88,7 @@ impl Error {
8288
#[derive(Clone, Copy, Debug, Eq, PartialEq, Sequence)]
8389
pub enum TokenKind {
8490
Annotation,
91+
Pragma,
8592
Keyword(Keyword),
8693
Type(Type),
8794

@@ -118,7 +125,6 @@ pub enum TokenKind {
118125
PlusPlus,
119126
/// `->`
120127
Arrow,
121-
At,
122128

123129
// Operators,
124130
ClosedBinOp(ClosedBinOp),
@@ -141,6 +147,7 @@ impl Display for TokenKind {
141147
fn fmt(&self, f: &mut Formatter) -> fmt::Result {
142148
match self {
143149
TokenKind::Annotation => write!(f, "annotation"),
150+
TokenKind::Pragma => write!(f, "pragma"),
144151
TokenKind::Keyword(keyword) => write!(f, "keyword `{keyword}`"),
145152
TokenKind::Type(type_) => write!(f, "keyword `{type_}`"),
146153
TokenKind::GPhase => write!(f, "gphase"),
@@ -166,7 +173,6 @@ impl Display for TokenKind {
166173
TokenKind::Comma => write!(f, "`,`"),
167174
TokenKind::PlusPlus => write!(f, "`++`"),
168175
TokenKind::Arrow => write!(f, "`->`"),
169-
TokenKind::At => write!(f, "`@`"),
170176
TokenKind::ClosedBinOp(op) => write!(f, "`{op}`"),
171177
TokenKind::BinOpEq(op) => write!(f, "`{op}=`"),
172178
TokenKind::ComparisonOp(op) => write!(f, "`{op}`"),
@@ -273,7 +279,6 @@ impl FromStr for Type {
273279
#[derive(Clone, Copy, Debug, Eq, PartialEq, Sequence)]
274280
pub enum Literal {
275281
Bitstring,
276-
Boolean,
277282
Float,
278283
Imaginary,
279284
Integer(Radix),
@@ -285,7 +290,6 @@ impl Display for Literal {
285290
fn fmt(&self, f: &mut Formatter<'_>) -> fmt::Result {
286291
f.write_str(match self {
287292
Literal::Bitstring => "bitstring",
288-
Literal::Boolean => "boolean",
289293
Literal::Float => "float",
290294
Literal::Imaginary => "imaginary",
291295
Literal::Integer(_) => "integer",
@@ -459,6 +463,23 @@ impl<'a> Lexer<'a> {
459463
tokens.next().map(|i| i.kind)
460464
}
461465

466+
/// Consumes the characters while they satisfy `f`. Returns the last character eaten, if any.
467+
fn eat_while(&mut self, mut f: impl FnMut(raw::TokenKind) -> bool) -> Option<raw::TokenKind> {
468+
let mut last_eaten: Option<raw::Token> = None;
469+
loop {
470+
let t = self.tokens.next_if(|t| f(t.kind));
471+
if t.is_none() {
472+
return last_eaten.map(|t| t.kind);
473+
}
474+
last_eaten = t;
475+
}
476+
}
477+
478+
fn eat_to_end_of_line(&mut self) {
479+
self.eat_while(|t| t != raw::TokenKind::Newline);
480+
self.next_if_eq(raw::TokenKind::Newline);
481+
}
482+
462483
/// Consumes a list of tokens zero or more times.
463484
fn kleen_star(&mut self, tokens: &[raw::TokenKind], complete: TokenKind) -> Result<(), Error> {
464485
let mut iter = tokens.iter();
@@ -471,6 +492,7 @@ impl<'a> Lexer<'a> {
471492
Ok(())
472493
}
473494

495+
#[allow(clippy::too_many_lines)]
474496
fn cook(&mut self, token: &raw::Token) -> Result<Option<Token>, Error> {
475497
let kind = match token.kind {
476498
raw::TokenKind::Bitstring { terminated: true } => {
@@ -487,7 +509,13 @@ impl<'a> Lexer<'a> {
487509
}
488510
raw::TokenKind::Ident => {
489511
let ident = &self.input[(token.offset as usize)..(self.offset() as usize)];
490-
Ok(Some(Self::ident(ident)))
512+
let cooked_ident = Self::ident(ident);
513+
if matches!(cooked_ident, TokenKind::Keyword(Keyword::Pragma)) {
514+
self.eat_to_end_of_line();
515+
Ok(Some(TokenKind::Pragma))
516+
} else {
517+
Ok(Some(cooked_ident))
518+
}
491519
}
492520
raw::TokenKind::HardwareQubit => Ok(Some(TokenKind::HardwareQubit)),
493521
raw::TokenKind::LiteralFragment(_) => {
@@ -525,6 +553,26 @@ impl<'a> Lexer<'a> {
525553
_ => Ok(Some(number.into())),
526554
}
527555
}
556+
raw::TokenKind::Single(Single::Sharp) => {
557+
let complete = TokenKind::Pragma;
558+
self.expect(raw::TokenKind::Ident, complete)?;
559+
let ident = &self.input[(token.offset as usize + 1)..(self.offset() as usize)];
560+
if matches!(Self::ident(ident), TokenKind::Keyword(Keyword::Pragma)) {
561+
self.eat_to_end_of_line();
562+
Ok(Some(complete))
563+
} else {
564+
let span = Span {
565+
lo: token.offset,
566+
hi: self.offset(),
567+
};
568+
Err(Error::Incomplete(
569+
raw::TokenKind::Ident,
570+
complete,
571+
raw::TokenKind::Ident,
572+
span,
573+
))
574+
}
575+
}
528576
raw::TokenKind::Single(single) => self.single(single).map(Some),
529577
raw::TokenKind::String { terminated: true } => {
530578
Ok(Some(TokenKind::Literal(Literal::String)))
@@ -565,7 +613,13 @@ impl<'a> Lexer<'a> {
565613
Ok(self.closed_bin_op(ClosedBinOp::Amp))
566614
}
567615
}
568-
Single::At => Ok(TokenKind::At),
616+
Single::At => {
617+
// AnnotationKeyword: '@' Identifier ('.' Identifier)* -> pushMode(EAT_TO_LINE_END);
618+
let complete = TokenKind::Annotation;
619+
self.expect(raw::TokenKind::Ident, complete);
620+
self.eat_to_end_of_line();
621+
Ok(complete)
622+
}
569623
Single::Bang => {
570624
if self.next_if_eq_single(Single::Eq) {
571625
Ok(TokenKind::ComparisonOp(ComparisonOp::BangEq))
@@ -627,6 +681,7 @@ impl<'a> Lexer<'a> {
627681
}
628682
}
629683
Single::Semi => Ok(TokenKind::Semicolon),
684+
Single::Sharp => unreachable!(),
630685
Single::Slash => Ok(self.closed_bin_op(ClosedBinOp::Slash)),
631686
Single::Star => {
632687
if self.next_if_eq_single(Single::Star) {
@@ -659,7 +714,6 @@ impl<'a> Lexer<'a> {
659714
"delay" => TokenKind::Delay,
660715
"reset" => TokenKind::Reset,
661716
"measure" => TokenKind::Measure,
662-
"false" | "true" => TokenKind::Literal(Literal::Boolean),
663717
ident => {
664718
if let Ok(keyword) = ident.parse::<Keyword>() {
665719
TokenKind::Keyword(keyword)

0 commit comments

Comments
 (0)