Rik Schaaf created OPENJPA-2920:
-----------------------------------

             Summary: CriteriaBuilder generating suboptimal code
                 Key: OPENJPA-2920
                 URL: https://issues.apache.org/jira/browse/OPENJPA-2920
             Project: OpenJPA
          Issue Type: Bug
          Components: criteria
    Affects Versions: 3.2.0
            Reporter: Rik Schaaf


*Background:*

I have the following entity:


{code:java}
package com.github.cc007.headsplugin.integration.database.entities;

import lombok.AccessLevel;
import lombok.Getter;
import lombok.NoArgsConstructor;
import lombok.Setter;
import lombok.ToString;

import javax.persistence.CascadeType;
import javax.persistence.Column;
import javax.persistence.Entity;
import javax.persistence.FetchType;
import javax.persistence.GeneratedValue;
import javax.persistence.GenerationType;
import javax.persistence.Id;
import javax.persistence.Index;
import javax.persistence.ManyToMany;
import javax.persistence.Table;
import javax.persistence.Version;
import java.util.Collections;
import java.util.HashSet;
import java.util.Set;

@Entity
@Table(name = "heads",
        indexes = {
                @Index(name = "heads_headowner_index", columnList = 
"headOwner"),
                @Index(name = "heads_name_index", columnList = "name")
        }
)
@Getter
@Setter
@ToString
@NoArgsConstructor
public class HeadEntity {

    @Id
    @Column(name = "id", nullable = false)
    @GeneratedValue(strategy = GenerationType.AUTO)
    @Setter(AccessLevel.NONE)
    private long id;

    @Version
    @Column(name = "version", nullable = false)
    private long version;

    @Column(name = "headOwner", unique = true, nullable = false)
    private String headOwner;

    @Column(name = "name", nullable = false)
    private String name;

    @Column(name = "value", length = 1023, nullable = false)
    private String value;

    @ToString.Exclude
    @ManyToMany(
            fetch = FetchType.EAGER,
            cascade = {CascadeType.PERSIST, CascadeType.MERGE},
            mappedBy = "heads"
    )
    @Getter(AccessLevel.NONE)
    @Setter(AccessLevel.NONE)
    private Set<DatabaseEntity> databases = new HashSet<>();

    @ToString.Exclude
    @ManyToMany(
            fetch = FetchType.EAGER,
            cascade = {CascadeType.PERSIST, CascadeType.MERGE},
            mappedBy = "heads"
    )
    @Getter(AccessLevel.NONE)
    @Setter(AccessLevel.NONE)
    private Set<TagEntity> tags = new HashSet<>();

    @ToString.Exclude
    @ManyToMany(
            fetch = FetchType.EAGER,
            cascade = {CascadeType.PERSIST, CascadeType.MERGE},
            mappedBy = "heads"
    )
    @Getter(AccessLevel.NONE)
    @Setter(AccessLevel.NONE)
    private Set<CategoryEntity> categories = new HashSet<>();

    @ToString.Exclude
    @ManyToMany(
            fetch = FetchType.LAZY,
            cascade = {CascadeType.PERSIST, CascadeType.MERGE},
            mappedBy = "heads"
    )
    @Getter(AccessLevel.NONE)
    @Setter(AccessLevel.NONE)
    private Set<SearchEntity> searches = new HashSet<>();

    public Set<DatabaseEntity> getDatabases() {
        return Collections.unmodifiableSet(databases);
    }

    public Set<TagEntity> getTags() {
        return Collections.unmodifiableSet(tags);
    }

    public Set<CategoryEntity> getCategories() {
        return Collections.unmodifiableSet(categories);
    }

    public Set<SearchEntity> getSearches() {
        return Collections.unmodifiableSet(searches);
    }
} {code}
Note the  {{{}unique = true{}}}, {{nullable = false}} (and the 
{{{}heads_headowner_index{}}})

I have created a couple of functions using a CriteriaBuilder:


{code:java}
public List<String> findAllHeadOwnersByHeadOwnerIn(Collection<String> 
headOwners) {
    final var resultList = new ArrayList<String>();
    final var headOwnerGroups = CollectionUtils.partitionCollection(headOwners, 
configProperties.getDatabase().getChunkSize());
    for (final var headOwnerGroup : headOwnerGroups) {
        final var query = querySelectionByCondition(HeadEntity.class,
                root -> root.get("headOwner"), String.class,
                (criteriaBuilder, root) -> 
root.get("headOwner").in(headOwnerGroup)
        );
        resultList.addAll(query.getResultList());
    }
    return resultList;
}

public <E, T> TypedQuery<T> querySelectionByCondition(
        Class<E> entityType,
        Function<Root<E>, Path<T>> selection,
        Class<T> selectPropertyType,
        BiFunction<CriteriaBuilder, Root<E>, Predicate> whereCondition
) {
    final var criteriaBuilder = entityManager.getCriteriaBuilder();

    final var criteriaQuery = criteriaBuilder
            .createQuery(selectPropertyType);

    final var root = criteriaQuery.from(entityType);

    
criteriaQuery.select(selection.apply(root)).where(whereCondition.apply(criteriaBuilder,
 root));

    return entityManager.createQuery(criteriaQuery);
}

public <E> Optional<E> getSingleResult(TypedQuery<E> query) {
    try {
        return Optional.of(query.getSingleResult());
    } catch (NoResultException e) {
        return Optional.empty();
    }
}

public <T> List<T> getMutableResultList(TypedQuery<T> query) {
    return new ArrayList<>(query.getResultList());
} {code}
 

Note the {{root.get("headOwner").in(headOwnerGroup)}} that is used in the 
{{findAllHeadOwnersByHeadOwnerIn}} function.
(FYI: I use a chunksize of 500, because it was causing issues in the past when 
I didn't partition or used anything above 1000).

*Expectation:*

When I run code that uses this, I would expect it to generate a {{SELECT 
h.headOwner FROM heads h WHERE h.headowner IN (...);}} 

*Actual behavior*

The resulting typed query is this: 


{code:java}
SELECT t0.headOwner FROM heads t0 
WHERE (
 (
     t0.headOwner = ?
  OR t0.headOwner = ?
  OR t0.headOwner = ?
  OR t0.headOwner = ?

  -- in total 500 t0.headOwner comparisons

  OR t0.headOwner = ?
  OR t0.headOwner = ?
  OR t0.headOwner = ?
 ) 
 AND t0.headOwner IS NOT NULL
) {code}
Note the {{AND t0.headOwner IS NOT NULL}} even though headOwner is not nullable.

In a database with 50000-ish rows, this query takes about 1500-2500ms to 
complete.
If I ran the query, without the AND statement, so:


{code:java}
SELECT t0.headOwner FROM heads t0 
WHERE (
 (
     t0.headOwner = ?
  OR t0.headOwner = ?
  OR t0.headOwner = ?

-- in total 500 t0.headOwner comparisons

  OR t0.headOwner = ?
  OR t0.headOwner = ?
  OR t0.headOwner = ?
 ) 
 -- without the AND t0.headOwner IS NOT NULL
){code}
This query only takes 150ms to complete.
If I were to use {{SELECT h.headOwner FROM heads h WHERE h.headowner IN 
(...);}} with 500 values in the {{IN()}} expression, then it only takes 80-100ms

*Versions:*
 * OpenJPA: 3.2.0
 * HSQLDB: 2.7.1
 * Java: OpenJDK 17.0.2

*Config:*
**
{code:java}
<?xml version="1.0" encoding="UTF-8"?>
<persistence version="2.1"
             xmlns="http://xmlns.jcp.org/xml/ns/persistence";
             xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance";
             xsi:schemaLocation="http://xmlns.jcp.org/xml/ns/persistence 
http://xmlns.jcp.org/xml/ns/persistence/persistence_2_1.xsd";>
  <persistence-unit name="default" transaction-type="RESOURCE_LOCAL">
    <provider>org.apache.openjpa.persistence.PersistenceProviderImpl</provider>
    
<class>com.github.cc007.headsplugin.integration.database.entities.CategoryEntity</class>
    
<class>com.github.cc007.headsplugin.integration.database.entities.DatabaseEntity</class>
    
<class>com.github.cc007.headsplugin.integration.database.entities.HeadEntity</class>
    
<class>com.github.cc007.headsplugin.integration.database.entities.SearchEntity</class>
    
<class>com.github.cc007.headsplugin.integration.database.entities.TagEntity</class>
    <exclude-unlisted-classes>true</exclude-unlisted-classes>
    <properties>
      <property name="openjpa.jdbc.SynchronizeMappings" 
value="buildSchema(SchemaAction='add', ForeignKeys=true)"/>
      <property name="openjpa.ConnectionURL" 
value="jdbc:hsqldb:file:plugins/HeadsPluginAPI/data/heads;hsqldb.lock_file=false"/>
      <property name="openjpa.ConnectionDriverName" 
value="org.hsqldb.jdbcDriver"/>
      <property name="openjpa.ConnectionUserName" value="sa"/>
      <property name="openjpa.ConnectionPassword" value=""/>
<!--      <property name="openjpa.Log" value="DefaultLevel=WARN, Tool=INFO"/>-->
      <property name="openjpa.Log" value="DefaultLevel=WARN, Tool=INFO, 
SQL=TRACE"/>
    </properties>
  </persistence-unit>
</persistence> {code}
 

 



--
This message was sent by Atlassian Jira
(v8.20.10#820010)

Reply via email to