% TSTP Solution File: PUZ012_1 by Vampire-SAT---4.8

%------------------------------------------------------------------------------
% File     : Vampire-SAT---4.8
% Problem  : PUZ012_1 : TPTP v8.1.2. Released v5.0.0.
% Transfm  : none
% Format   : tptp:raw
% Command  : vampire --mode casc_sat -m 16384 --cores 7 -t %d %s

% Computer : n020.cluster.edu
% Model    : x86_64 x86_64
% CPU      : Intel(R) Xeon(R) CPU E5-2620 v4 @ 2.10GHz
% Memory   : 8042.1875MB
% OS       : Linux 3.10.0-693.el7.x86_64
% CPULimit : 300s
% WCLimit  : 300s
% DateTime : Sun May  5 08:49:33 EDT 2024

% Result   : Theorem 0.14s 0.38s
% Output   : Refutation 0.14s
% Verified : 
% SZS Type : Refutation
%            Derivation depth      :   11
%            Number of leaves      :   21
% Syntax   : Number of formulae    :   47 (  16 unt;  12 typ;   0 def)
%            Number of atoms       :   62 (   0 equ)
%            Maximal formula atoms :    3 (   1 avg)
%            Number of connectives :   53 (  26   ~;  22   |;   4   &)
%                                         (   0 <=>;   1  =>;   0  <=;   0 <~>)
%            Maximal formula depth :    7 (   3 avg)
%            Maximal term depth    :    1 (   1 avg)
%            Number of types       :    3 (   2 usr)
%            Number of type conns  :    8 (   4   >;   4   *;   0   +;   0  <<)
%            Number of predicates  :    5 (   4 usr;   1 prp; 0-2 aty)
%            Number of functors    :    6 (   6 usr;   6 con; 0-0 aty)
%            Number of variables   :   22 (  22   !;   0   ?;  22   :)

% Comments : 
%------------------------------------------------------------------------------
% Sort declaration: `box` is a user-defined type ($tType).
tff(type_def_5,type,
    box: $tType ).

% Sort declaration: `fruit` is a user-defined type ($tType).
tff(type_def_6,type,
    fruit: $tType ).

% Constant declarations of sort `box`: boxa, boxb, boxc.
tff(func_def_0,type,
    boxa: box ).

tff(func_def_1,type,
    boxb: box ).

tff(func_def_2,type,
    boxc: box ).

% Constant declarations of sort `fruit`: apples, bananas, oranges.
tff(func_def_3,type,
    apples: fruit ).

tff(func_def_4,type,
    bananas: fruit ).

tff(func_def_5,type,
    oranges: fruit ).

% Binary predicate on two fruits. This is an ordinary user predicate,
% not the built-in equality `=`.
tff(pred_def_1,type,
    equal_fruits: ( fruit * fruit ) > $o ).

% Binary predicate on two boxes. Declared here but not used by any
% formula in the refutation below.
tff(pred_def_2,type,
    equal_boxes: ( box * box ) > $o ).

% Binary predicate relating a box to a fruit.
tff(pred_def_3,type,
    contains: ( box * fruit ) > $o ).

% Binary predicate relating a box to a fruit.
tff(pred_def_4,type,
    label: ( box * fruit ) > $o ).

% Final step of the refutation: the empty clause. f101 asserts
% equal_fruits(bananas,oranges), which f32 denies.
tff(f106,plain,
    $false,
    inference(subsumption_resolution,[],[f101,f32]) ).

% Clause form of axiom f12; the formula text is unchanged.
tff(f32,plain,
    ~ equal_fruits(bananas,oranges),
    inference(cnf_transformation,[],[f12]) ).

% Input axiom `bananas_not_oranges`.
tff(f12,axiom,
    ~ equal_fruits(bananas,oranges),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',bananas_not_oranges) ).

% Resolves f93 (with X0 := bananas) against the unit clause f85,
% contains(boxa,bananas), leaving equal_fruits(bananas,oranges).
tff(f101,plain,
    equal_fruits(bananas,oranges),
    inference(resolution,[],[f93,f85]) ).

% f81 with its literal equal_fruits(apples,bananas) removed, since f36
% denies that literal. What remains is contains(boxa,bananas).
tff(f85,plain,
    contains(boxa,bananas),
    inference(subsumption_resolution,[],[f81,f36]) ).

% Clause form of axiom f11; the formula text is unchanged.
tff(f36,plain,
    ~ equal_fruits(apples,bananas),
    inference(cnf_transformation,[],[f11]) ).

% Input axiom `apples_not_bananas`.
tff(f11,axiom,
    ~ equal_fruits(apples,bananas),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',apples_not_bananas) ).

% Resolves f54 (with X0 := apples) against the unit clause f30,
% contains(boxb,apples), removing the literal ~contains(boxb,apples).
tff(f81,plain,
    ( equal_fruits(apples,bananas)
    | contains(boxa,bananas) ),
    inference(resolution,[],[f54,f30]) ).

% Clause form of axiom f17; the formula text is unchanged.
tff(f30,plain,
    contains(boxb,apples),
    inference(cnf_transformation,[],[f17]) ).

% Input axiom `boxb_contains_apples`.
tff(f17,axiom,
    contains(boxb,apples),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',boxb_contains_apples) ).

% Resolves the literal ~contains(X0,X2) of f42 (with X0 := boxb,
% X2 := bananas) against contains(boxb,bananas) from f51. The remaining
% variable X1 of f42 appears here as X0; contains(boxa,bananas) is
% carried over from f51.
tff(f54,plain,
    ! [X0: fruit] :
      ( ~ contains(boxb,X0)
      | equal_fruits(X0,bananas)
      | contains(boxa,bananas) ),
    inference(resolution,[],[f42,f51]) ).

% Instantiates f40 with X0 := bananas and removes contains(boxc,bananas)
% using f45, leaving the two remaining alternatives boxb and boxa.
tff(f51,plain,
    ( contains(boxb,bananas)
    | contains(boxa,bananas) ),
    inference(resolution,[],[f40,f45]) ).

% Resolves f41 (with X0 := boxc, X1 := bananas) against the unit clause
% f28, label(boxc,bananas), leaving ~contains(boxc,bananas).
tff(f45,plain,
    ~ contains(boxc,bananas),
    inference(resolution,[],[f41,f28]) ).

% Clause form of axiom f16; the formula text is unchanged.
tff(f28,plain,
    label(boxc,bananas),
    inference(cnf_transformation,[],[f16]) ).

% Input axiom `boxc_labelled_bananas`.
tff(f16,axiom,
    label(boxc,bananas),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',boxc_labelled_bananas) ).

% Clause form of f21: the same two literals, listed in the opposite order.
tff(f41,plain,
    ! [X0: box,X1: fruit] :
      ( ~ label(X0,X1)
      | ~ contains(X0,X1) ),
    inference(cnf_transformation,[],[f21]) ).

% Pushes the negation of f3 inward: ~(A & B) becomes ~A | ~B.
tff(f21,plain,
    ! [X0: box,X1: fruit] :
      ( ~ contains(X0,X1)
      | ~ label(X0,X1) ),
    inference(ennf_transformation,[],[f3]) ).

% Input axiom `label_is_wrong`: no box both contains and is labelled
% with the same fruit.
tff(f3,axiom,
    ! [X0: box,X1: fruit] :
      ~ ( contains(X0,X1)
        & label(X0,X1) ),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',label_is_wrong) ).

% Clause form of axiom f4; the formula text is unchanged.
tff(f40,plain,
    ! [X0: fruit] :
      ( contains(boxc,X0)
      | contains(boxb,X0)
      | contains(boxa,X0) ),
    inference(cnf_transformation,[],[f4]) ).

% Input axiom `each_thing_is_in_a_box`: every fruit is contained in
% boxc, boxb or boxa.
tff(f4,axiom,
    ! [X0: fruit] :
      ( contains(boxc,X0)
      | contains(boxb,X0)
      | contains(boxa,X0) ),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',each_thing_is_in_a_box) ).

% Clause form of f23: the same three literals in a different order, with
% the quantified variables listed in a different order.
tff(f42,plain,
    ! [X2: fruit,X0: box,X1: fruit] :
      ( ~ contains(X0,X2)
      | equal_fruits(X1,X2)
      | ~ contains(X0,X1) ),
    inference(cnf_transformation,[],[f23]) ).

% Flattening step applied to f22; the formula text is identical to f22.
tff(f23,plain,
    ! [X0: box,X1: fruit,X2: fruit] :
      ( equal_fruits(X1,X2)
      | ~ contains(X0,X2)
      | ~ contains(X0,X1) ),
    inference(flattening,[],[f22]) ).

% Rewrites the implication of f6 as a disjunction:
% (A & B) => C becomes C | ~A | ~B.
tff(f22,plain,
    ! [X0: box,X1: fruit,X2: fruit] :
      ( equal_fruits(X1,X2)
      | ~ contains(X0,X2)
      | ~ contains(X0,X1) ),
    inference(ennf_transformation,[],[f6]) ).

% Input axiom `contains_is_well_defined1`: if one box contains both X1
% and X2, then equal_fruits(X1,X2) holds.
tff(f6,axiom,
    ! [X0: box,X1: fruit,X2: fruit] :
      ( ( contains(X0,X2)
        & contains(X0,X1) )
     => equal_fruits(X1,X2) ),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',contains_is_well_defined1) ).

% Resolves the unit clause f86, contains(boxa,oranges), against the
% literal ~contains(X0,X2) of f42 (with X0 := boxa, X2 := oranges).
% The remaining variable X1 of f42 appears here as X0.
tff(f93,plain,
    ! [X0: fruit] :
      ( ~ contains(boxa,X0)
      | equal_fruits(X0,oranges) ),
    inference(resolution,[],[f86,f42]) ).

% Resolves the unit clause f85, contains(boxa,bananas), against the
% literal ~contains(boxa,bananas) of f52, leaving contains(boxa,oranges).
tff(f86,plain,
    contains(boxa,oranges),
    inference(resolution,[],[f85,f52]) ).

% f50 with its literal contains(boxb,oranges) removed, since f46 denies
% that literal.
tff(f52,plain,
    ( ~ contains(boxa,bananas)
    | contains(boxa,oranges) ),
    inference(subsumption_resolution,[],[f50,f46]) ).

% Resolves f41 (with X0 := boxb, X1 := oranges) against the unit clause
% f29, label(boxb,oranges), leaving ~contains(boxb,oranges).
tff(f46,plain,
    ~ contains(boxb,oranges),
    inference(resolution,[],[f41,f29]) ).

% Clause form of axiom f15; the formula text is unchanged.
tff(f29,plain,
    label(boxb,oranges),
    inference(cnf_transformation,[],[f15]) ).

% Input axiom `boxb_labelled_oranges`.
tff(f15,axiom,
    label(boxb,oranges),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',boxb_labelled_oranges) ).

% Instantiates f40 with X0 := oranges and resolves contains(boxc,oranges)
% against ~contains(boxc,oranges) from f26; ~contains(boxa,bananas) is
% carried over from f26.
tff(f50,plain,
    ( contains(boxb,oranges)
    | contains(boxa,oranges)
    | ~ contains(boxa,bananas) ),
    inference(resolution,[],[f40,f26]) ).

% Clause form of f20; the formula text is unchanged.
tff(f26,plain,
    ( ~ contains(boxc,oranges)
    | ~ contains(boxa,bananas) ),
    inference(cnf_transformation,[],[f20]) ).

% Pushes the negation of f19 inward: ~(A & B) becomes ~A | ~B.
tff(f20,plain,
    ( ~ contains(boxc,oranges)
    | ~ contains(boxa,bananas) ),
    inference(ennf_transformation,[],[f19]) ).

% Negation of the conjecture f18; the refutation derives $false from
% this together with the axioms.
tff(f19,negated_conjecture,
    ~ ( contains(boxc,oranges)
      & contains(boxa,bananas) ),
    inference(negated_conjecture,[],[f18]) ).

% Conjecture to prove: boxc contains oranges and boxa contains bananas.
tff(f18,conjecture,
    ( contains(boxc,oranges)
    & contains(boxa,bananas) ),
    file('/export/starexec/sandbox2/benchmark/theBenchmark.p',prove_boxa_contains_bananas_and_boxc_oranges) ).

%------------------------------------------------------------------------------
%----ORIGINAL SYSTEM OUTPUT
% 0.07/0.12  % Problem    : PUZ012_1 : TPTP v8.1.2. Released v5.0.0.
% 0.07/0.14  % Command    : vampire --mode casc_sat -m 16384 --cores 7 -t %d %s
% 0.14/0.36  % Computer : n020.cluster.edu
% 0.14/0.36  % Model    : x86_64 x86_64
% 0.14/0.36  % CPU      : Intel(R) Xeon(R) CPU E5-2620 v4 @ 2.10GHz
% 0.14/0.36  % Memory   : 8042.1875MB
% 0.14/0.36  % OS       : Linux 3.10.0-693.el7.x86_64
% 0.14/0.36  % CPULimit   : 300
% 0.14/0.36  % WCLimit    : 300
% 0.14/0.36  % DateTime   : Fri May  3 18:02:23 EDT 2024
% 0.14/0.36  % CPUTime    : 
% 0.14/0.36  % (26342)Running in auto input_syntax mode. Trying TPTP
% 0.14/0.38  % (26347)fmb+10_1_bce=on:fmbas=expand:fmbksg=on:fmbsr=1.3_569 on theBenchmark for (569ds/0Mi)
% 0.14/0.38  % (26346)fmb+10_1_fmbas=off:fmbsr=1.3:nm=2_1451 on theBenchmark for (1451ds/0Mi)
% 0.14/0.38  % (26348)dis-2_2:3_amm=sco:anc=none:bce=on:fsr=off:gsp=on:nm=16:nwc=1.2:nicw=on:sac=on:sp=weighted_frequency_476 on theBenchmark for (476ds/0Mi)
% 0.14/0.38  % (26351)dis+11_4:5_nm=4_216 on theBenchmark for (216ds/0Mi)
% 0.14/0.38  % (26349)fmb+10_1_bce=on:fmbas=expand:fmbksg=on:fmbsr=1.3:gsp=on:nm=4_470 on theBenchmark for (470ds/0Mi)
% 0.14/0.38  % (26352)fmb+10_1_fmbas=off:fmbsr=1.3:nm=2:si=on:rtra=on:rawr=on:rp=on:fmbksg=on_1451 on theBenchmark for (1451ds/0Mi)
% 0.14/0.38  % (26350)dis+1_20_av=off:lcm=predicate:nm=2:nwc=2.0_396 on theBenchmark for (396ds/0Mi)
% 0.14/0.38  Detected minimum model sizes of [1,1]
% 0.14/0.38  Detected maximum model sizes of [3,3]
% 0.14/0.38  Detected minimum model sizes of [1,1]
% 0.14/0.38  Detected maximum model sizes of [3,3]
% 0.14/0.38  Detected minimum model sizes of [1,1]
% 0.14/0.38  Detected maximum model sizes of [3,3]
% 0.14/0.38  Detected minimum model sizes of [1,1]
% 0.14/0.38  Detected maximum model sizes of [3,3]
% 0.14/0.38  TRYING [1,1]
% 0.14/0.38  TRYING [1,1]
% 0.14/0.38  TRYING [1,2]
% 0.14/0.38  TRYING [1,1]
% 0.14/0.38  TRYING [1,2]
% 0.14/0.38  TRYING [1,3]
% 0.14/0.38  % (26348)Also succeeded, but the first one will report.
% 0.14/0.38  TRYING [1,1]
% 0.14/0.38  % (26350)First to succeed.
% 0.14/0.38  TRYING [1,2]
% 0.14/0.38  TRYING [1,2]
% 0.14/0.38  TRYING [2,2]
% 0.14/0.38  TRYING [2,3]
% 0.14/0.38  % (26351)Also succeeded, but the first one will report.
% 0.14/0.38  TRYING [1,3]
% 0.14/0.38  TRYING [2,2]
% 0.14/0.38  TRYING [3,3]
% 0.14/0.38  TRYING [2,3]
% 0.14/0.38  TRYING [2,3]
% 0.14/0.38  % (26350)Solution written to "/export/starexec/sandbox2/tmp/vampire-proof-26342"
% 0.14/0.38  Cannot enumerate next child to try in an incomplete setup
% 0.14/0.38  % (26346)Refutation not found, incomplete strategy% (26346)------------------------------
% 0.14/0.38  % (26346)Version: Vampire 4.8 (commit 3a798227e on 2024-05-03 07:42:47 +0200)
% 0.14/0.38  % (26346)Termination reason: Refutation not found, incomplete strategy
% 0.14/0.38  
% 0.14/0.38  % (26346)Memory used [KB]: 728
% 0.14/0.38  % (26346)Time elapsed: 0.005 s
% 0.14/0.38  % (26346)Instructions burned: 5 (million)
% 0.14/0.38  TRYING [2,3]
% 0.14/0.38  TRYING [3,3]
% 0.14/0.38  % (26346)------------------------------
% 0.14/0.38  % (26346)------------------------------
% 0.14/0.38  TRYING [3,3]
% 0.14/0.38  Cannot enumerate next child to try in an incomplete setup
% 0.14/0.38  % (26352)Refutation not found, incomplete strategy% (26352)------------------------------
% 0.14/0.38  % (26352)Version: Vampire 4.8 (commit 3a798227e on 2024-05-03 07:42:47 +0200)
% 0.14/0.38  % (26352)Termination reason: Refutation not found, incomplete strategy
% 0.14/0.38  
% 0.14/0.38  % (26352)Memory used [KB]: 732
% 0.14/0.38  % (26352)Time elapsed: 0.005 s
% 0.14/0.38  % (26352)Instructions burned: 5 (million)
% 0.14/0.38  TRYING [3,3]
% 0.14/0.38  % (26350)Refutation found. Thanks to Tanya!
% 0.14/0.38  % SZS status Theorem for theBenchmark
% 0.14/0.38  % SZS output start Proof for theBenchmark
% See solution above
% 0.14/0.38  % (26350)------------------------------
% 0.14/0.38  % (26350)Version: Vampire 4.8 (commit 3a798227e on 2024-05-03 07:42:47 +0200)
% 0.14/0.38  % (26350)Termination reason: Refutation
% 0.14/0.38  
% 0.14/0.38  % (26350)Memory used [KB]: 753
% 0.14/0.38  % (26350)Time elapsed: 0.004 s
% 0.14/0.38  % (26350)Instructions burned: 4 (million)
% 0.14/0.38  % (26342)Success in time 0.02 s
%------------------------------------------------------------------------------