TSTP Solution File: PUZ018-1 by SNARK---20120808r022

View Problem - Process Solution

%------------------------------------------------------------------------------
% File     : SNARK---20120808r022
% Problem  : PUZ018-1 : TPTP v8.1.0. Bugfixed v1.2.0.
% Transfm  : none
% Format   : tptp:raw
% Command  : run-snark %s %d

% Computer : n024.cluster.edu
% Model    : x86_64 x86_64
% CPU      : Intel(R) Xeon(R) CPU E5-2620 v4 2.10GHz
% Memory   : 8042.1875MB
% OS       : Linux 3.10.0-693.el7.x86_64
% CPULimit : 300s
% WCLimit  : 600s
% DateTime : Mon Jul 18 18:26:44 EDT 2022

% Result   : Unsatisfiable 0.20s 0.52s
% Output   : Refutation 0.20s
% Verified : 
% SZS Type : Refutation
%            Derivation depth      :    8
%            Number of leaves      :   23
% Syntax   : Number of clauses     :   41 (  29 unt;   8 nHn;  40 RR)
%            Number of literals    :   76 (   0 equ;  27 neg)
%            Maximal clause size   :    7 (   1 avg)
%            Maximal term depth    :    1 (   1 avg)
%            Number of predicates  :    6 (   5 usr;   1 prp; 0-2 aty)
%            Number of functors    :   10 (  10 usr;  10 con; 0-0 aty)
%            Number of variables   :   12 (   1 sgn)

% Comments : 
%------------------------------------------------------------------------------
% all_on(X) implies on(P,X) for each of the three constants a, b and c.
% Only this direction (all_on => on) appears among the clauses listed here.

% If all_on(X) holds then a is on X.
cnf(all_on_a_on,axiom,
    ( ~ all_on(X)
    | on(a,X) ),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',all_on_a_on) ).

% If all_on(X) holds then b is on X.
cnf(all_on_b_on,axiom,
    ( ~ all_on(X)
    | on(b,X) ),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',all_on_b_on) ).

% If all_on(X) holds then c is on X.
cnf(all_on_c_on,axiom,
    ( ~ all_on(X)
    | on(c,X) ),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',all_on_c_on) ).

% Ground facts for consecutive/2: consecutive(D1,D2) is asserted for each
% adjacent pair of days from sunday up to friday.
% NOTE(review): no consecutive/2 fact mentioning saturday is listed here;
% presumably this listing shows only the clauses the refutation used, so the
% problem file may declare more - confirm against the benchmark.
cnf(monday_follows_sunday,axiom,
    consecutive(sunday,monday),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',monday_follows_sunday) ).

cnf(tuesday_follows_monday,axiom,
    consecutive(monday,tuesday),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',tuesday_follows_monday) ).

cnf(wednesday_follows_tuesday,axiom,
    consecutive(tuesday,wednesday),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',wednesday_follows_tuesday) ).

cnf(thursday_follows_wednesday,axiom,
    consecutive(wednesday,thursday),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',thursday_follows_wednesday) ).

cnf(friday_follows_thursday,axiom,
    consecutive(thursday,friday),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',friday_follows_thursday) ).

% Negative ground facts for same_person/2 and same_day/2. The header reports
% 0 equality literals, so distinctness is encoded with these ordinary
% predicates rather than with built-in equality.
% Each fact below discharges the same_person/same_day literal of
% no_two_off_twice_together in one of the derived clauses 62-65.

% a and b are not the same person.
cnf(a_not_b,axiom,
    ~ same_person(a,b),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',a_not_b) ).

% a and c are not the same person.
cnf(a_not_c,axiom,
    ~ same_person(a,c),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',a_not_c) ).

% sunday and tuesday are not the same day.
cnf(sunday_not_tuesday,axiom,
    ~ same_day(sunday,tuesday),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',sunday_not_tuesday) ).

% sunday and thursday are not the same day.
cnf(sunday_not_thursday,axiom,
    ~ same_day(sunday,thursday),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',sunday_not_thursday) ).

% tuesday and thursday are not the same day.
cnf(tuesday_not_thursday,axiom,
    ~ same_day(tuesday,thursday),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',tuesday_not_thursday) ).

% all_on holds for at least one of the seven days sunday..saturday.
% This is the 7-literal clause behind "Maximal clause size : 7" in the header.
% The refutation works by eliminating these disjuncts one at a time
% (derived clauses 49-57 and 75).
cnf(all_on_one_day,hypothesis,
    ( all_on(sunday)
    | all_on(monday)
    | all_on(tuesday)
    | all_on(wednesday)
    | all_on(thursday)
    | all_on(friday)
    | all_on(saturday) ),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',all_on_one_day) ).

% For any chain of days with consecutive(X,Y), consecutive(Y,Z) and
% consecutive(Z,U), no V is on for all three of X, Y and Z.
% U occurs only in the literal ~ consecutive(Z,U) (the single singleton
% variable counted as "1 sgn" in the header), so the constraint applies only
% when Z has a known consecutive successor; there is no on(V,U) literal.
cnf(not_on_for_3_days,hypothesis,
    ( ~ consecutive(X,Y)
    | ~ consecutive(Y,Z)
    | ~ consecutive(Z,U)
    | ~ on(V,X)
    | ~ on(V,Y)
    | ~ on(V,Z) ),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',not_on_for_3_days) ).

% For any X, U, Y, Z: unless same_person(X,U) or same_day(Y,Z) holds, at least
% one of on(X,Y), on(X,Z), on(U,Y), on(U,Z) holds. Put differently, X and U
% cannot both be not-on for both Y and Z.
% All-positive (non-Horn) clause; used as the nucleus of the UR-resolution
% steps that derive clauses 62-65.
cnf(no_two_off_twice_together,hypothesis,
    ( on(X,Y)
    | on(X,Z)
    | on(U,Y)
    | on(U,Z)
    | same_person(X,U)
    | same_day(Y,Z) ),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',no_two_off_twice_together) ).

% Negative ground facts for on/2: specific (person, day) pairs that are not on.
% a is not on sunday, tuesday or thursday; b is not on thursday or saturday;
% c is not on sunday.

cnf(a_off_sunday,hypothesis,
    ~ on(a,sunday),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',a_off_sunday) ).

cnf(a_off_tuesday,hypothesis,
    ~ on(a,tuesday),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',a_off_tuesday) ).

cnf(a_off_thursday,hypothesis,
    ~ on(a,thursday),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',a_off_thursday) ).

cnf(b_off_thursday,hypothesis,
    ~ on(b,thursday),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',b_off_thursday) ).

cnf(b_off_saturday,hypothesis,
    ~ on(b,saturday),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',b_off_saturday) ).

cnf(c_off_sunday,hypothesis,
    ~ on(c,sunday),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',c_off_sunday) ).

% Negated conjecture: the goal is all_on(friday), so its negation is asserted
% and the clause set is shown to be unsatisfiable. In this refutation it is
% used once, to remove all_on(friday) from all_on_one_day (derived clause 49).
cnf(prove_all_on_friday,negated_conjecture,
    ~ all_on(friday),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',prove_all_on_friday) ).

% Derived clauses 49-60: shrink the all_on_one_day disjunction step by step.
% Each UR-RESOLVE step refutes all_on(D) for one day D by resolving an
% all_on_*_on axiom against an off-duty fact; the following REWRITE step
% removes that disjunct from the remaining clause.

% all_on_one_day with all_on(friday) removed by the negated conjecture.
cnf(49,plain,
    ( all_on(sunday)
    | all_on(monday)
    | all_on(tuesday)
    | all_on(wednesday)
    | all_on(thursday)
    | all_on(saturday) ),
    inference('REWRITE',[status(thm)],[all_on_one_day,prove_all_on_friday]) ).

% a is not on sunday, so all_on(sunday) cannot hold.
cnf(50,plain,
    ~ all_on(sunday),
    inference('UR-RESOLVE',[status(thm)],[all_on_a_on,a_off_sunday]) ).

% Clause 49 with all_on(sunday) removed.
cnf(51,plain,
    ( all_on(monday)
    | all_on(tuesday)
    | all_on(wednesday)
    | all_on(thursday)
    | all_on(saturday) ),
    inference('REWRITE',[status(thm)],[49,50]) ).

% a is not on tuesday, so all_on(tuesday) cannot hold.
cnf(52,plain,
    ~ all_on(tuesday),
    inference('UR-RESOLVE',[status(thm)],[all_on_a_on,a_off_tuesday]) ).

% Clause 51 with all_on(tuesday) removed.
cnf(53,plain,
    ( all_on(monday)
    | all_on(wednesday)
    | all_on(thursday)
    | all_on(saturday) ),
    inference('REWRITE',[status(thm)],[51,52]) ).

% a is not on thursday, so all_on(thursday) cannot hold.
cnf(54,plain,
    ~ all_on(thursday),
    inference('UR-RESOLVE',[status(thm)],[all_on_a_on,a_off_thursday]) ).

% Clause 53 with all_on(thursday) removed.
cnf(55,plain,
    ( all_on(monday)
    | all_on(wednesday)
    | all_on(saturday) ),
    inference('REWRITE',[status(thm)],[53,54]) ).

% b is not on saturday, so all_on(saturday) cannot hold.
cnf(56,plain,
    ~ all_on(saturday),
    inference('UR-RESOLVE',[status(thm)],[all_on_b_on,b_off_saturday]) ).

% Clause 55 with all_on(saturday) removed: only monday and wednesday remain.
cnf(57,plain,
    ( all_on(monday)
    | all_on(wednesday) ),
    inference('REWRITE',[status(thm)],[55,56]) ).

% Resolve all_on_c_on (X = wednesday) against the all_on(wednesday) disjunct
% of clause 57, replacing it with on(c,wednesday).
cnf(60,plain,
    ( all_on(monday)
    | on(c,wednesday) ),
    inference('HYPERRESOLVE',[status(thm)],[all_on_c_on,57]) ).

% Derived clauses 62-65: positive on/2 facts obtained from
% no_two_off_twice_together. In each step the listed unit clauses refute five
% of its six literals, leaving the remaining on/2 literal as a unit.

% Instance X = a, U = b, Y = tuesday, Z = thursday; on(b,tuesday) remains.
cnf(62,plain,
    on(b,tuesday),
    inference('UR-RESOLVE',[status(thm)],[no_two_off_twice_together,a_off_tuesday,a_off_thursday,b_off_thursday,a_not_b,tuesday_not_thursday]) ).

% Instance X = a, U = c, Y = sunday, Z = tuesday; on(c,tuesday) remains.
cnf(63,plain,
    on(c,tuesday),
    inference('UR-RESOLVE',[status(thm)],[no_two_off_twice_together,a_off_sunday,a_off_tuesday,c_off_sunday,a_not_c,sunday_not_tuesday]) ).

% Instance X = a, U = b, Y = sunday, Z = thursday; on(b,sunday) remains.
cnf(64,plain,
    on(b,sunday),
    inference('UR-RESOLVE',[status(thm)],[no_two_off_twice_together,a_off_sunday,a_off_thursday,b_off_thursday,a_not_b,sunday_not_thursday]) ).

% Instance X = a, U = c, Y = sunday, Z = thursday; on(c,thursday) remains.
cnf(65,plain,
    on(c,thursday),
    inference('UR-RESOLVE',[status(thm)],[no_two_off_twice_together,a_off_sunday,a_off_thursday,c_off_sunday,a_not_c,sunday_not_thursday]) ).

% Derived clauses 72 and 74: negative on/2 facts obtained from
% not_on_for_3_days. The three consecutive/2 facts and two on/2 units refute
% five of its six literals, leaving the middle day's ~ on literal.

% Instance X = sunday, Y = monday, Z = tuesday, U = wednesday, V = b:
% b is on sunday (64) and tuesday (62), so b is not on monday.
cnf(72,plain,
    ~ on(b,monday),
    inference('UR-RESOLVE',[status(thm)],[not_on_for_3_days,64,monday_follows_sunday,tuesday_follows_monday,wednesday_follows_tuesday,62]) ).

% Instance X = tuesday, Y = wednesday, Z = thursday, U = friday, V = c:
% c is on tuesday (63) and thursday (65), so c is not on wednesday.
cnf(74,plain,
    ~ on(c,wednesday),
    inference('UR-RESOLVE',[status(thm)],[not_on_for_3_days,65,wednesday_follows_tuesday,thursday_follows_wednesday,friday_follows_thursday,63]) ).

% Final steps of the refutation.

% Clause 60 with on(c,wednesday) removed by clause 74: all_on(monday) is the
% only disjunct left.
cnf(75,plain,
    all_on(monday),
    inference('REWRITE',[status(thm)],[60,74]) ).

% The nested HYPERRESOLVE step combines all_on_b_on with clause 75 (which
% yields on(b,monday)); rewriting that with clause 72, ~ on(b,monday), gives
% the empty clause and completes the refutation.
cnf(78,plain,
    $false,
    inference('REWRITE',[status(thm)],[inference('HYPERRESOLVE',[status(thm)],[all_on_b_on,75]),72]) ).

%------------------------------------------------------------------------------
%----ORIGINAL SYSTEM OUTPUT
% 0.07/0.12  % Problem  : PUZ018-1 : TPTP v8.1.0. Bugfixed v1.2.0.
% 0.07/0.13  % Command  : run-snark %s %d
% 0.12/0.34  % Computer : n024.cluster.edu
% 0.12/0.34  % Model    : x86_64 x86_64
% 0.12/0.34  % CPU      : Intel(R) Xeon(R) CPU E5-2620 v4 @ 2.10GHz
% 0.12/0.34  % Memory   : 8042.1875MB
% 0.12/0.34  % OS       : Linux 3.10.0-693.el7.x86_64
% 0.12/0.34  % CPULimit : 300
% 0.12/0.34  % WCLimit  : 600
% 0.12/0.34  % DateTime : Sun May 29 00:33:36 EDT 2022
% 0.12/0.34  % CPUTime  : 
% 0.20/0.46  /export/starexec/sandbox2/benchmark/theBenchmark.p
% 0.20/0.47  * 
% 0.20/0.47  * 
% 0.20/0.47  #<PACKAGE "SNARK-USER">
% 0.20/0.47  * 
% 0.20/0.47  SNARK-TPTP-OPTIONS
% 0.20/0.47  * 
% 0.20/0.47  ((AGENDA-LENGTH-LIMIT NIL) (AGENDA-LENGTH-BEFORE-SIMPLIFICATION-LIMIT NIL)
% 0.20/0.47   (USE-HYPERRESOLUTION T) (USE-UR-RESOLUTION T) (USE-PARAMODULATION T)
% 0.20/0.47   (USE-FACTORING :POS)
% 0.20/0.47   (USE-LITERAL-ORDERING-WITH-HYPERRESOLUTION 'LITERAL-ORDERING-P)
% 0.20/0.47   (USE-LITERAL-ORDERING-WITH-PARAMODULATION 'LITERAL-ORDERING-P)
% 0.20/0.47   (ORDERING-FUNCTIONS>CONSTANTS T) (ASSERT-CONTEXT :CURRENT)
% 0.20/0.47   (RUN-TIME-LIMIT 300) (LISTEN-FOR-COMMANDS NIL)
% 0.20/0.47   (USE-CLOSURE-WHEN-SATISFIABLE T) (PRINT-ROWS-WHEN-GIVEN NIL)
% 0.20/0.47   (PRINT-ROWS-WHEN-DERIVED NIL) (PRINT-UNORIENTABLE-ROWS NIL)
% 0.20/0.47   (PRINT-ROW-WFFS-PRETTILY NIL) (PRINT-FINAL-ROWS :TPTP)
% 0.20/0.47   (PRINT-OPTIONS-WHEN-STARTING NIL) (USE-VARIABLE-NAME-SORTS NIL)
% 0.20/0.47   (USE-PURITY-TEST T) (USE-RELEVANCE-TEST T) (DECLARE-TPTP-SYMBOLS1)
% 0.20/0.47   (DECLARE-TPTP-SYMBOLS2))
% 0.20/0.47  * 
% 0.20/0.47  "."
% 0.20/0.47  * 
% 0.20/0.47  ; Begin refute-file /export/starexec/sandbox2/benchmark/theBenchmark.p 2022-05-29T00:33:37
% 0.20/0.47  ; Running SNARK from /davis/home/graph/tptp/Systems/SNARK---20120808r022/Source/snark-system.lisp in SBCL 1.0.12 on n024.cluster.edu at 2022-05-29T00:33:37
% 0.20/0.52  
% 0.20/0.52  
% 0.20/0.52  #||
% 0.20/0.52  % SZS status Unsatisfiable for /export/starexec/sandbox2/benchmark/theBenchmark.p
% 0.20/0.52  % SZS output start Refutation
% See solution above
% 0.20/0.52  ||#
% 0.20/0.52  
% 0.20/0.52  ; Summary of computation:
% 0.20/0.52  ;       133 formulas have been input or derived (from 59 formulas).
% 0.20/0.52  ;        78 (59%) were retained.  Of these,
% 0.20/0.52  ;            9 (12%) were simplified or subsumed later,
% 0.20/0.52  ;           69 (88%) are still being kept.
% 0.20/0.52  ; 
% 0.20/0.52  ; Run time in seconds excluding printing time:
% 0.20/0.52  ;     0.005  11%   Read assertion file          (1 call)
% 0.20/0.52  ;     0.001   2%   Assert                       (48 calls)
% 0.20/0.52  ;     0.003   7%   Process new row              (102 calls)
% 0.20/0.52  ;     0.007  15%   Resolution                   (116 calls)
% 0.20/0.52  ;     0.000   0%   Paramodulation               (58 calls)
% 0.20/0.52  ;     0.000   0%   Factoring                    (2 calls)
% 0.20/0.52  ;     0.001   2%   Condensing                   (19 calls)
% 0.36/0.52  ;     0.001   2%   Forward subsumption          (19 calls)
% 0.36/0.52  ;     0.000   0%   Backward subsumption         (19 calls)
% 0.36/0.52  ;     0.002   4%   Forward simplification       (102 calls)
% 0.36/0.52  ;     0.002   4%   Backward simplification      (78 calls)
% 0.36/0.52  ;     0.000   0%   Ordering                     (81 calls)
% 0.36/0.52  ;     0.001   2%   Sortal reasoning             (32 calls)
% 0.36/0.52  ;     0.000   0%   Purity testing               (1 call)
% 0.36/0.52  ;     0.023  50%   Other
% 0.36/0.52  ;     0.046        Total
% 0.36/0.52  ;     0.049        Real time
% 0.36/0.52  ; 
% 0.36/0.52  ; Term-hash-array has 81 terms in all.
% 0.36/0.52  ; Feature-vector-row-index has 10 entries (14 at peak, 19 added, 9 deleted).
% 0.36/0.52  ; Feature-vector-row-index has 28 nodes (39 at peak, 74 added, 46 deleted).
% 0.36/0.52  ;  Retrieved 0 possibly forward subsuming rows in 19 calls.
% 0.36/0.52  ;  Retrieved 0 possibly backward subsumed rows in 19 calls.
% 0.36/0.52  ; Path-index has 89 entries (90 at peak, 112 added, 23 deleted).
% 0.36/0.52  ; Path-index has 79 nodes (79 at peak, 100 added, 21 deleted).
% 0.36/0.52  ; Trie-index has 89 entries (90 at peak, 112 added, 23 deleted).
% 0.36/0.52  ; Trie-index has 102 nodes (103 at peak, 125 added, 23 deleted).
% 0.36/0.52  ; Retrieved 60 generalization terms in 141 calls.
% 0.36/0.52  ; Retrieved 59 instance terms in 58 calls.
% 0.36/0.52  ; Retrieved 5,293 unifiable terms in 1,427 calls.
% 0.36/0.52  ; 
% 0.36/0.52  ; The agenda of rows to process has 6 entries:
% 0.36/0.52  ;     6 with value 6
% 0.36/0.52  ; The agenda of rows to give has 11 entries:
% 0.36/0.52  ;     1 with value (4 5)           7 with value (4 6)            3 with value (4 21)
% 0.36/0.52  Evaluation took:
% 0.36/0.52    0.05 seconds of real time
% 0.36/0.52    0.042458 seconds of user run time
% 0.36/0.52    0.007237 seconds of system run time
% 0.36/0.52    0 calls to %EVAL
% 0.36/0.52    0 page faults and
% 0.36/0.52    4,294,952 bytes consed.
% 0.36/0.52  :PROOF-FOUND
% 0.36/0.52  ; End refute-file /export/starexec/sandbox2/benchmark/theBenchmark.p 2022-05-29T00:33:37
% 0.36/0.52  :PROOF-FOUND
% 0.36/0.52  * 
%------------------------------------------------------------------------------