Difference between revisions of "Strings"

partial

 (set-logic QF_S)

 (set-logic S)

 (set-option :strings-exp true)

 (set-option :strings-fmf true)

 (set-option :strings-lb 1)

 (set-option :strings-alphabet-card n)

 (declare-fun x () String)

 (str.++ s1 s2 ... sn)

 (str.len s)

 (str.at s i)

 (str.substr s i j )

 (str.in.re s r)

 (str.to.re s)

 (re.++ r_1 r_2 ... r_n)

 (re.union r_1 r_2 ... r_n)

 (re.inter r_1 r_2 ... r_n)

 (re.* r)

 (re.+ r)

 (re.opt r)

 (re.range s t)

 (re.loop r l u)

 (re.loop r l)

 re.nostr

 re.allchar

 (str.at s i)

 (str.substr s i j)

 (str.contains s t)

(str.indexof s t i)

(str.replace s t1 t2)

(str.prefixof s t)

(str.suffixof s t)

(str.to.int s)

(int.to.str i)

 (assert (= (str.substr "a" 2 10) "b"))

 (assert (= (str.substr "a" 2 1) "b"))
 (assert (= (str.substr "a" 2 1) "c"))

 (assert (= (str.at x j) "b"))
 (assert (> j 0))
 (assert (> (str.len x) j))

 (define-fun fun1 ((?x String) (?s String)) Bool
   (or (= ?x ?s)
       (> (str.len ?x) (str.len ?s))
    ))

 (set-logic QF_S)
 
 (declare-fun x () String)
 
 (assert (= (str.++ x "ab") (str.++ "ba" x)))
 (assert (= (str.len x) 7))
 
 (check-sat)

 (set-logic QF_S)
 
 (declare-fun x () String)
 (declare-fun y () String)
 
 (assert (not (=  x y)))
 (assert (= (str.len x) (str.len y)))
 
 (check-sat)

 (set-logic QF_S)
 
 (declare-fun x () String)
 (declare-fun y () String)
 (assert (not (= (str.++ x y) (str.++ y x))))
 
 (check-sat)

 (set-logic QF_S)
 
 (declare-fun x () String)
 (declare-fun y () String)
 (declare-fun z () String)
 
 (assert (= (str.++ x "ab" y) (str.++ y "ba" z)))
 (assert (= z (str.++ x y)))
 (assert (not (= (str.++ x "a") (str.++ "a" x))))
 
 (check-sat)

 (set-logic QF_S)
 (set-option :strings-fmf true)
 
 (declare-fun x () String)
 (declare-fun y () String)
 
 (assert
   (str.in.re x
      (re.* (re.++ (re.* (str.to.re "a") ) (str.to.re "b") ))))
 (assert (str.in.re y
      (re.* (re.++ (re.* (str.to.re "a") ) (str.to.re "b") ))))
 
 (assert (not (= x y)))
 (assert (= (str.len x) (str.len y)))
 
 (check-sat)

 smt.setLogic("S");

 Type string = em.stringType();

 // std::string
 std::string std_str_ab("ab");
 // CVC4::String
 CVC4::String cvc4_str_ab(std_str_ab);
 CVC4::String cvc4_str_abc("abc");
 // String constants
 Expr ab = em.mkConst(cvc4_str_ab);
 Expr abc = em.mkConst(CVC4::String("abc"));

 Expr x = em.mkVar("x", string);
 Expr y = em.mkVar("y", string);
 Expr z = em.mkVar("z", string);

 // String concatenation: x.ab.y
 Expr lhs = em.mkExpr(kind::STRING_CONCAT, x, ab, y);
 // String concatenation: abc.z
 Expr rhs = em.mkExpr(kind::STRING_CONCAT, abc, z);
 // x.ab.y = abc.z
 Expr formula1 = em.mkExpr(kind::EQUAL, lhs, rhs);
 // Length of y: |y|
 Expr leny = em.mkExpr(kind::STRING_LENGTH, y);
 // |y| >= 0
 Expr formula2 = em.mkExpr(kind::GEQ, leny, em.mkConst(Rational(0)));
 // Regular expression: (ab[c-e]*f)|g|h
 Expr r = em.mkExpr(kind::REGEXP_UNION,
 em.mkExpr(kind::REGEXP_CONCAT,
 em.mkExpr(kind::STRING_TO_REGEXP, em.mkConst(String("ab"))),
 em.mkExpr(kind::REGEXP_STAR,
 em.mkExpr(kind::REGEXP_RANGE, em.mkConst(String("c")), em.mkConst(String("e")))),
 em.mkExpr(kind::STRING_TO_REGEXP, em.mkConst(String("f")))),
 em.mkExpr(kind::STRING_TO_REGEXP, em.mkConst(String("g"))),
 em.mkExpr(kind::STRING_TO_REGEXP, em.mkConst(String("h"))));
 // String variables
 Expr s1 = em.mkVar("s1", string);
 Expr s2 = em.mkVar("s2", string);
 // String concatenation: s1.s2
 Expr s = em.mkExpr(kind::STRING_CONCAT, s1, s2);
 // s1.s2 in (ab[c-e]*f)|g|h
 Expr formula3 = em.mkExpr(kind::STRING_IN_REGEXP, s, r);

 Expr q = em.mkExpr(kind::AND,
   formula1,
   formula2,
   formula3);

 Result result = smt.checkSat(q);
 std::cout << "CVC4 reports: " << q << " is " << result << "." << std::endl;
 if(result == Result::SAT) {
   std::cout << " x = " << smt.getValue(x) << std::endl;
   std::cout << " s1.s2 = " << smt.getValue(s) << std::endl;
 }

@@ Line 6: / Line 6: @@
 '''We highly recommend that users use SMT-LIB [http://smt-lib.org/language.shtml Version 2.5], instead of Version 2.0.''' The major difference is in the definition of escape sequences for string literals.
-'''The syntax below is for CVC4 version > 1.4. Version 1.3 has only has ''partial'' support for syntax in this document.'''
+'''The syntax below is for CVC4 version > 1.4.''' Version 1.3 has only ''partial'' support for the syntax in this document.
-Since the string subsolver is still relatively new, the current stable version of CVC4 (1.4) does not provide the latest version of that subsolver.  Please use our '''latest Development version instead'''.
+Since the string (sub)solver is still relatively new, the current stable version of CVC4 (1.4) does not provide the latest version of that solver.  Please use our latest Development version instead.
-This string solver has a full support of '''ASCII''' characters. For arbitrary alphabets, please refer to sequence (parametrized string) theory.
+Currently, the string solver supports string constants over a set of characters limited to printable ASCII characters. Other characters ''must'' be encoded with escape sequences. For arbitrary alphabets, we plan to provide later a separate solver for a theory of parametric sequences.
-In compliance with SMT-Lib v2, only printable basic ASCII characters are allowed to be appeared natively in string literals. Other ASCII characters '''must''' be encoded as escape sequences.
+To use the string solver it is important to declare initially (using the <code>set-logic</code> command) an SMT-LIB logic that includes strings. Since the SMT-LIB standard does not have an official theory of strings and related logics yet, the logic names described below are tentative and might change later.
-The Theory of Strings (Quantifier-Free) logic symbol:
+The basic logic is <code>QF_S</code>, consisting of quantifier-free formulas over just the theory of strings, e.g.:
    (set-logic QF_S)
-The logic symbol is '''IMPORTANT''' to the Theory of String, and it has to be set up.
+If the formulas contain symbols from other theories, please add them accordingly, e.g., if the formulas contain symbols from the BitVector theory, the logic symbol should be <code>QF_SBV</code>.
-If the constraints contain more theories, please add them accordingly, e.g. if it contains BitVector, the symbol should be QF_SBV.
+The logic consisting of the full (quantified) theory of strings is <code>S</code>:
-The Theory of Quantified Strings logic symbol:
    (set-logic S)
-Since the theory of strings is pretty new in CVC4, we are still working on the standards for syntax.
-If you have some comments or suggestions about CVC4 strings, please feel feel to email me: tianyi-liang@uiowa.edu
-==Unsat Core==
-String engine '''does''' support unsat core. To generate unsat cores, you must enable proofs at configure time, and
+==Unsat Cores==
-then run with "--dump-unsat-cores".
+The string solver supports the generation of unsatisfiable cores. As with other subsolvers, though, you must enable proofs at configuration time, and
+then run CVC4 with the "--dump-unsat-cores" flag.
 ==Options==
-To use the experimental functions (disabled by default, even in ALL_SUPPORTED mode):
+Some functions in the theory currently have only experimental support
+and are disabled by default (even in the <code>ALL_SUPPORTED</code> logic).
+To use them:
    (set-option :strings-exp true)
-To use finite model finding mode (false by default):
+The solver can be run in ''finite model finding mode'' which guarantees termination for satisfiable problems. This mode is disabled by default. To enable it:
    (set-option :strings-fmf true)
-The string finite model finding mode is much '''slower''' than the default mode. We highly recommend you '''NOT''' using it if it is not necessary.
+Note that in this mode the solver is much '''slower''' than in default mode. So we recommend it only as a fall back option when the default mode fails to find a solution within a reasonably large timeout.
 To select the strategy of LB rule application: 0-lazy, 1-eager, 2-no (0 by default):
@@ Line 45: / Line 44: @@
    (set-option :strings-alphabet-card n)
 This is a reserved option for the extension of the sequence theory.
+==Alphabet==
+Currently, the solver's theory is based on an alphabet consisting of the 256 characters from (8-bit) Extended ASCII. Since there are several versions of Extended ASCII, we allow string constants to contain only ''printable US ASCII characters'', which are encoded in the same way in all Extended ASCII versions.
+'''Note:''' The alphabet will change to the one prescribed by the SMT-LIB standard once there is one.
 ==Printable Characters==
-A ''printable'' character is any character between 0x20 and 0x7e in the standard ASCII table.
+A ''printable'' character is any character with numerical value between 0x20 and 0x7e in the standard US ASCII encoding.
 ==Escape Sequences for String Literals==
+We support escape sequences common in most programming languages to represent non-printable characters.
 {| border="1"
 |-
-| \0 … \9
+| <code>\0</code> … <code>\9</code>
 | represents ASCII character 0 … 9, respectively
 |-
-| \a, \b, \e, \f, \n, \r, \t, \v
+| <code>\a</code>, <code>\b</code>, <code>\e</code>, <code>\f</code>, <code>\n</code>, <code>\r</code>, <code>\t</code>, <code>\v</code>
 | represents its corresponding ASCII character (C++ convention)
 |-

`\0` … `\9`	represents ASCII character 0 … 9, respectively
`\a`, `\b`, `\e`, `\f`, `\n`, `\r`, `\t`, `\v`	represents its corresponding ASCII character (C++ convention)
\ooo	matches an ASCII character, where ooo consists of (no more than) three digits that represent the octal character code (from 0 to 377). For example, \101 represents ‘A’, while “\437” represents a string with two characters, “#7” (important).
\xNN	matches an ASCII character, where NN is a two-digit hexadecimal character code. NN has to be exactly two hex-digits. If not, an exception will be raised.

Difference between revisions of "Strings"

Revision as of 14:07, 9 June 2015

Contents

Syntax

Unsat Cores

Options

Alphabet

Printable Characters

Escape Sequences for String Literals

Strings

Escape Sequences for Regular Expressions

Symbolic Regular Expression

Experimental Mode

Partial Functions

Extension

Limitation

Examples

API

C++

Java

References

Navigation menu

Views

Personal tools

CVC4

For CVC4 Developers

Cascade

Meta

Wiki

Search

Tools