casacore-doc/html/UDFBase_8h_source.html

//# UDFBase.h: Abstract base class for a user-defined TaQL function

//# Copyright (C) 2010

//# Associated Universities, Inc. Washington DC, USA.

//#

//# This library is free software; you can redistribute it and/or modify it

//# under the terms of the GNU Library General Public License as published by

//# the Free Software Foundation; either version 2 of the License, or (at your

//# option) any later version.

//#

//# This library is distributed in the hope that it will be useful, but WITHOUT

//# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or

//# FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Library General Public

//# License for more details.

//#

//# You should have received a copy of the GNU Library General Public License

//# along with this library; if not, write to the Free Software Foundation,

//# Inc., 675 Massachusetts Ave, Cambridge, MA 02139, USA.

//#

//# Correspondence concerning AIPS++ should be addressed as follows:

//#        Internet email: casa-feedback@nrao.edu.

//#        Postal address: AIPS++ Project Office

//#                        National Radio Astronomy Observatory

//#                        520 Edgemont Road

//#                        Charlottesville, VA 22903-2475 USA


#ifndef TABLES_UDFBASE_H

#define TABLES_UDFBASE_H


//# Includes

#include <casacore/casa/aips.h>

#include <casacore/tables/TaQL/ExprNodeRep.h>

#include <casacore/tables/Tables/Table.h>

#include <casacore/tables/TaQL/TaQLStyle.h>

#include <casacore/casa/Containers/Record.h>

#include <casacore/casa/Containers/Block.h>

#include <casacore/casa/stdmap.h>


namespace casacore {


  // <summary>

  // Abstract base class for a user-defined TaQL function

  // </summary>

  //

  // <synopsis>

  // This class makes it possible to add user-defined functions (UDF) to TaQL.

  // A UDF has to be implemented in a class derived from this class and can

  // contain one or more user-defined functions.

  // <br>A few functions have to be implemented in the class as described below.

  // In this way TaQL can be extended with arbitrary functions, which can be

  // normal functions as well as aggregate functions (often used with GROUPBY).

  //

  // A UDF is a class derived from this base class. It must contain the

  // following member functions. See also the example below.

  // <table border=0>

  // <tr>

  //  <td><src>makeObject</src></td>

  //  <td>a static function to create an object of the UDF class. This function

  //    needs to be registered.

  //  </td>

  // </tr>

  // <tr>

  //  <td><src>setup</src></td>

  //  <td>this virtual function is called after the object has been created.

  //   It should initialize the object using the function arguments that

  //   can be obtained using the function <src>operands()</src>. The setup

  //   function should perform the following:

  //   <ul>

  //    <li>Define the data type of the result using <src>setDataType<src>.

  //        The data type should be derived from the data types of the function

  //        arguments. The possible data types are defined in class

  //        TableExprNodeRep.

  //        Note that a UDF can support multiple data types. For example, a

  //        function like <src>min</src> can be used for Int, Double, or a mix.

  //        Function 'checkDT' in class TableExprNodeMulti can be used to

  //        check the data types of the operands and determine the result

  //        data type.

  //    <li>Define if the function is an aggregate function calculating

  //        an aggregated value in a group (e.g., minimum or mean).

  //        <src>setAggregate</src> can be used to tell so.

  //    <li>Define the dimensionality of the result using <src>setNDim</src>.

  //        A value of 0 means a scalar. A value of -1 means an array with

  //        a dimensionality that can vary from row to row.

  //    <li>Optionally use <src>setShape</src> to define the shape if the

  //        results are arrays with a shape that is the same for all rows.

  //        It will also set ndim if setNDim was not used yet, otherwise

  //        it checks if it ndim matches.

  //    <li>Optionally set the unit of the result using <src>setUnit</src>.

  //        TaQL has full support of units, so UDFs should behave the same.

  //        It is possible to change the unit of the function arguments.

  //        For example:

  //        <ul>

  //         <li>a function like 'sin' can force its argument to be

  //          in radians; TaQL will scale the argument as needed. This can be

  //          done like

  //          <src>TableExprNodeUnit::adaptUnit (operands()[i], "rad");</src>

  //         <li>A function like 'asin' will have a result in radians.

  //          Such a UDF should set its result unit to rad.

  //         <li>A function like 'min' wants its arguments to have the same

  //          unit and will set its result unit to it. It can be done like:

  //          <src>setUnit (TableExprFuncNode::makeEqualUnits

  //                        (operands(), 0, operands().size()));</src>

  //        </ul>

  //        See class TableExprFuncNode for more info about these functions.

  //    <li>Optionally define attributes as a Record object. They can be used

  //        by UDFs to tell something more about the type of value.

  //    <li>Optionally define if the result is a constant value using

  //        <src>setConstant</src>. It means that the function is not

  //        dependent on the row number in the table being queried.

  //        This is usually the case if all UDF arguments are constant.

  //   </ul>

  //  </td>

  // </tr>

  // <tr>

  //  <td><src>getXXX</src></td>

  //  <td>these are virtual get functions for each possible data type. The

  //      get functions matching the data types set by the setup

  //      function need to be implemented.

  //      The <src>get</src> functions have an argument TableExprId

  //      defining the table row (or record) for which the function has

  //      to be evaluated.

  //      If the UDF is an aggregate functions the TableExprId has to be

  //      upcasted to an TableExprIdAggr object from which all TableExprId

  //      objects in an aggregation group can be retrieved.

  //      <srcblock>

  //        const TableExprIdAggr& aid = TableExprIdAggr::cast (id);

  //        const vector<TableExprId>& ids = aid.result().ids(id.rownr());

  //      </srcblock>

  //  </td>

  // </tr>

  // </table>

  //

  // A UDF has to be made known to TaQL by adding it to the UDF registry with

  // its name and 'makeObject' function.

  // UDFs will usually reside in a shared library that is loaded dynamically.

  // TaQL will load a UDF in the following way:

  // <ul>

  //  <li> The UDF name used in TaQL consists of two parts: a library name

  //       and a function name separated by a dot. Both parts need to be given.

  //       Note that the library name can also be seen as a UDF scope, so

  //       different UDFs with equal names can be used from different libraries.

  //       A UDF should be registered with this full name.

  //       <br>The "USING STYLE" clause can be used to define a synonym for

  //       a (long) library name in the TaQLStyle object. The library part

  //       of the UDF will always be looked up in this synonym map.

  //  <li> If a UDF is not found in the registry, it will be tried to load

  //       a shared library using the library name part. The libraries tried

  //       to be loaded are lib<library>.so and libcasa_<library>.so.

  //       On Mac .dylib will be tried. If loaded successfully, a special

  //       function 'register_libname' will be called first. It should

  //       register each UDF in the shared library using UDFBase::register.

  // </ul>

  // </synopsis>

  //

  // <example>

  // The following examples show a normal UDF function.

  // <br>It returns True if the function argument matches 1.

  // It can be seen that it checks if the argument is an integer scalar.

  // <srcblock>

  // class TestUDF: public UDFBase

  // {

  // public:

  //   TestUDF() {}

  //   // Registered function to create the UDF object.

  //   // The name of the function is not important here.

  //   static UDFBase* makeObject (const String&)

  //     { return new TestUDF(); }

  //   // Setup and check the details; result is a bool scalar value.

  //   virtual void setup (const Table&, const TaQLStyle&)

  //   {

  //     AlwaysAssert (operands().size() == 1, AipsError);

  //     AlwaysAssert (operands()[0]->dataType() == TableExprNodeRep::NTInt,

  //                   AipsError);

  //     AlwaysAssert (operands()[0]->valueType() == TableExprNodeRep::VTScalar,

  //                   AipsError);

  //     setDataType (TableExprNodeRep::NTBool);

  //     setNDim (0);                                 // scalar result

  //     setConstant (operands()[0].isConstant());    // constant result?

  //   }

  //   // Get the value for the given id.

  //   // It gets the value of the operand and checks if it is 1.

  //   Bool getBool (const TableExprId& id)

  //     { return operands()[0]->getInt(id) == 1; }

  // };

  // </srcblock>

  // </example>


  // <example>

  // The following example shows an aggregate UDF function.

  // It calculates the sum of the cubes of the values in a group.

  // <srcblock>

  // class TestUDFAggr: public UDFBase

  // {

  // public:

  //   TestUDFAggr() {}

  //   // Registered function to create the UDF object.

  //   // The name of the function is not important here.

  //   static UDFBase* makeObject (const String&) { return new TestUDFAggr(); }

  //   // Setup and check the details; result is an integer scalar value.

  //   // It aggregates the values of multiple rows.

  //   virtual void setup (const Table&, const TaQLStyle&)

  //   {

  //     AlwaysAssert (operands().size() == 1, AipsError);

  //     AlwaysAssert (operands()[0]->dataType() == TableExprNodeRep::NTInt, AipsError);

  //     AlwaysAssert (operands()[0]->valueType() == TableExprNodeRep::VTScalar, AipsError);

  //     setDataType (TableExprNodeRep::NTInt);

  //     setNDim (0);           // scalar

  //     setAggregate (True);   // aggregate function

  //   }

  //   // Get the value of a group.

  //   // It aggregates the values of multiple rows.

  //   Int64 getInt (const TableExprId& id)

  //   {

  //     // Cast the id to a TableExprIdAggr object.

  //     const TableExprIdAggr& aid = TableExprIdAggr::cast (id);

  //     // Get the vector of ids for this group.

  //     const vector<TableExprId>& ids = aid.result().ids(id.rownr());

  //     // Get the values for all ids and accumulate them.

  //     Int64 sum3 = 0;

  //     for (vector<TableExprId>::const_iterator it=ids.begin();

  //          it!=ids.end(); ++it){

  //       Int64 v = operands()[0]->getInt(*it);

  //         sum3 += v*v*v;

  //     }

  //     return sum3;

  //   }

  // };

  // </srcblock>

  // </example>

  // More examples of UDF functions can be found in classes UDFMSCal

  // and DirectionUDF.


  class UDFBase

  {

  public:

    // The signature of a global or static member function creating an object

    // of the UDF.

    typedef UDFBase* MakeUDFObject (const String& functionName);


    // Only default constructor is needed.

    UDFBase();


    // Destructor.

    virtual ~UDFBase();


    // Evaluate the function and return the result.

    // Their default implementations throw a "not implemented" exception.

    // <group>

    virtual Bool      getBool     (const TableExprId& id);

    virtual Int64     getInt      (const TableExprId& id);

    virtual Double    getDouble   (const TableExprId& id);

    virtual DComplex  getDComplex (const TableExprId& id);

    virtual String    getString   (const TableExprId& id);

    virtual TaqlRegex getRegex    (const TableExprId& id);

    virtual MVTime    getDate     (const TableExprId& id);

    virtual MArray<Bool>     getArrayBool     (const TableExprId& id);

    virtual MArray<Int64>    getArrayInt      (const TableExprId& id);

    virtual MArray<Double>   getArrayDouble   (const TableExprId& id);

    virtual MArray<DComplex> getArrayDComplex (const TableExprId& id);

    virtual MArray<String>   getArrayString   (const TableExprId& id);

    virtual MArray<MVTime>   getArrayDate     (const TableExprId& id);

    // </group>


    // Get the unit.


    const String& getUnit() const

      { return itsUnit; }


    // Get the attributes.


    const Record& getAttributes() const

      { return itsAttributes; }


    // Flatten the node tree by adding the node and its children to the vector.

    virtual void flattenTree (std::vector<TableExprNodeRep*>&);


  private:

    // Set up the function object.

    virtual void setup (const Table& table,

                        const TaQLStyle&) = 0;


  protected:

    // Get the operands.


    std::vector<TENShPtr>& operands()

      { return itsOperands; }


    // Set the data type.

    // This function must be called by the setup function of the derived class.

    void setDataType (TableExprNodeRep::NodeDataType);


    // Set the dimensionality of the results.

    // <br> 0 means that the results are scalars.

    // <br> -1 means that the results are arrays with unknown dimensionality.

    // <br> >0 means that the results are arrays with that dimensionality.

    // This function must be called by the setup function of the derived class.

    void setNDim (Int ndim);


    // Set the shape of the results if it is fixed and known.

    void setShape (const IPosition& shape);


    // Set the unit of the result.

    // If this function is not called by the setup function of the derived

    // class, the result has no unit.

    void setUnit (const String& unit);


    // Set the attributes of the result.

    // If this function is not called by the setup function of the derived

    // class, the result has no attributes.

    void setAttributes (const Record& attributes);


    // Define if the result is constant (e.g. if all arguments are constant).

    // If this function is not called by the setup function of the derived

    // class, the result is not constant.

    void setConstant (Bool isConstant);


    // Define if the UDF is an aggregate function (usually used in GROUPBY).

    void setAggregate (Bool isAggregate);


    // Let a derived class recreate its column objects in case a selection

    // has to be applied.

    // The default implementation does nothing.

    virtual void recreateColumnObjects (const Vector<rownr_t>& rownrs);


  public:

    // Register the name and construction function of a UDF (thread-safe).

    // An exception is thrown if this name already exists with a different

    // construction function.

    static void registerUDF (const String& name, MakeUDFObject* func);


    // Initialize the function object.

    void init (const std::vector<TENShPtr>& arg,

               const TableExprInfo& tableInfo, const TaQLStyle&);


    // Get the data type.


    TableExprNodeRep::NodeDataType dataType() const

      { return itsDataType; }


    // Get the dimensionality of the results.

    // (0=scalar, -1=array with variable ndim, >0=array with fixed ndim


    Int ndim() const

      { return itsNDim; }


    // Get the result shape if the same for all results.


    const IPosition& shape() const

      { return itsShape; }


    // Tell if the UDF gives a constant result.


    Bool isConstant() const

      { return itsIsConstant; }


    // Tell if the UDF is an aggregate function.


    Bool isAggregate() const

      { return itsIsAggregate; }


    // Do not apply the selection.


    void disableApplySelection()

      { itsApplySelection = False; }


    // If needed, let the UDF re-create column objects for a selection of rows.

    // It calls the function recreateColumnObjects.

    void applySelection (const Vector<rownr_t>& rownrs);


    // Create a UDF object (thread-safe).

    // It looks in the map with fixed function names. If unknown,

    // it looks if a wildcarded function name is supported (for PyTaQL).

    static UDFBase* createUDF (const String& name, const TaQLStyle& style);


  private:

    //# Data members.

    std::vector<TENShPtr>          itsOperands;

    TableExprNodeRep::NodeDataType itsDataType;

    Int                            itsNDim;

    IPosition                      itsShape;

    String                         itsUnit;

    Record                         itsAttributes;

    Bool                           itsIsConstant;

    Bool                           itsIsAggregate;

    Bool                           itsApplySelection;

    //# The registry is used for two purposes:

    //# 1. It is a map of known function names (lib.func) to funcptr.

    //#    Function name * means that the library can contain any function,

    //#    which is intended for python functions (through PyTaQL).

    //# 2. The loaded libraries are kept in the map (with 0 funcptr).

    static map<String, MakeUDFObject*> theirRegistry;

    static std::recursive_mutex theirMutex;

  };


} // end namespace


#endif

casacore::IPosition
Definition IPosition.h:117

casacore::MArray
Definition MArray.h:68

casacore::MVTime
Definition MVTime.h:268

casacore::Record
Definition Record.h:178

casacore::String
String: the storage and methods of handling collections of characters.
Definition String.h:223

casacore::TaQLStyle
Definition TaQLStyle.h:63

casacore::TableExprId
Definition TableExprId.h:95

casacore::TableExprInfo
Class to connect a Table and its alias name.
Definition ExprNodeRep.h:125

casacore::TableExprNodeRep::NodeDataType
NodeDataType
Define the data types of a node.
Definition ExprNodeRep.h:205

casacore::Table
Definition Table.h:157

casacore::TaqlRegex
Definition ExprNodeRep.h:80

casacore::UDFBase
Definition UDFBase.h:234

casacore::UDFBase::getArrayDate
virtual MArray< MVTime > getArrayDate(const TableExprId &id)

casacore::UDFBase::getArrayInt
virtual MArray< Int64 > getArrayInt(const TableExprId &id)

casacore::UDFBase::getDouble
virtual Double getDouble(const TableExprId &id)

casacore::UDFBase::getAttributes
const Record & getAttributes() const
Get the attributes.
Definition UDFBase.h:269

casacore::UDFBase::getUnit
const String & getUnit() const
Get the unit.
Definition UDFBase.h:265

casacore::UDFBase::itsIsAggregate
Bool itsIsAggregate
Definition UDFBase.h:375

casacore::UDFBase::itsShape
IPosition itsShape
Definition UDFBase.h:371

casacore::UDFBase::itsDataType
TableExprNodeRep::NodeDataType itsDataType
Definition UDFBase.h:369

casacore::UDFBase::setAttributes
void setAttributes(const Record &attributes)
Set the attributes of the result.

casacore::UDFBase::init
void init(const std::vector< TENShPtr > &arg, const TableExprInfo &tableInfo, const TaQLStyle &)
Initialize the function object.

casacore::UDFBase::operands
std::vector< TENShPtr > & operands()
Get the operands.
Definition UDFBase.h:282

casacore::UDFBase::setDataType
void setDataType(TableExprNodeRep::NodeDataType)
Set the data type.

casacore::UDFBase::getInt
virtual Int64 getInt(const TableExprId &id)

casacore::UDFBase::dataType
TableExprNodeRep::NodeDataType dataType() const
Get the data type.
Definition UDFBase.h:333

casacore::UDFBase::getDate
virtual MVTime getDate(const TableExprId &id)

casacore::UDFBase::itsApplySelection
Bool itsApplySelection
Definition UDFBase.h:376

casacore::UDFBase::getRegex
virtual TaqlRegex getRegex(const TableExprId &id)

casacore::UDFBase::itsUnit
String itsUnit
Definition UDFBase.h:372

casacore::UDFBase::MakeUDFObject
UDFBase * MakeUDFObject(const String &functionName)
The signature of a global or static member function creating an object of the UDF.
Definition UDFBase.h:238

casacore::UDFBase::applySelection
void applySelection(const Vector< rownr_t > &rownrs)
If needed, let the UDF re-create column objects for a selection of rows.

casacore::UDFBase::itsIsConstant
Bool itsIsConstant
Definition UDFBase.h:374

casacore::UDFBase::ndim
Int ndim() const
Get the dimensionality of the results.
Definition UDFBase.h:338

casacore::UDFBase::setAggregate
void setAggregate(Bool isAggregate)
Define if the UDF is an aggregate function (usually used in GROUPBY).

casacore::UDFBase::isAggregate
Bool isAggregate() const
Tell if the UDF is an aggregate function.
Definition UDFBase.h:350

casacore::UDFBase::setUnit
void setUnit(const String &unit)
Set the unit of the result.

casacore::UDFBase::recreateColumnObjects
virtual void recreateColumnObjects(const Vector< rownr_t > &rownrs)
Let a derived class recreate its column objects in case a selection has to be applied.

casacore::UDFBase::itsOperands
std::vector< TENShPtr > itsOperands
Definition UDFBase.h:368

casacore::UDFBase::getArrayDComplex
virtual MArray< DComplex > getArrayDComplex(const TableExprId &id)

casacore::UDFBase::itsNDim
Int itsNDim
Definition UDFBase.h:370

casacore::UDFBase::UDFBase
UDFBase()
Only default constructor is needed.

casacore::UDFBase::createUDF
static UDFBase * createUDF(const String &name, const TaQLStyle &style)
Create a UDF object (thread-safe).

casacore::UDFBase::getBool
virtual Bool getBool(const TableExprId &id)
Evaluate the function and return the result.

casacore::UDFBase::getDComplex
virtual DComplex getDComplex(const TableExprId &id)

casacore::UDFBase::setConstant
void setConstant(Bool isConstant)
Define if the result is constant (e.g.

casacore::UDFBase::shape
const IPosition & shape() const
Get the result shape if the same for all results.
Definition UDFBase.h:342

casacore::UDFBase::setNDim
void setNDim(Int ndim)
Set the dimensionality of the results.

casacore::UDFBase::flattenTree
virtual void flattenTree(std::vector< TableExprNodeRep * > &)
Flatten the node tree by adding the node and its children to the vector.

casacore::UDFBase::theirMutex
static std::recursive_mutex theirMutex
Definition UDFBase.h:383

casacore::UDFBase::getArrayDouble
virtual MArray< Double > getArrayDouble(const TableExprId &id)

casacore::UDFBase::~UDFBase
virtual ~UDFBase()
Destructor.

casacore::UDFBase::itsAttributes
Record itsAttributes
Definition UDFBase.h:373

casacore::UDFBase::theirRegistry
static map< String, MakeUDFObject * > theirRegistry
Definition UDFBase.h:382

casacore::UDFBase::isConstant
Bool isConstant() const
Tell if the UDF gives a constant result.
Definition UDFBase.h:346

casacore::UDFBase::disableApplySelection
void disableApplySelection()
Do not apply the selection.
Definition UDFBase.h:354

casacore::UDFBase::getString
virtual String getString(const TableExprId &id)

casacore::UDFBase::registerUDF
static void registerUDF(const String &name, MakeUDFObject *func)
Register the name and construction function of a UDF (thread-safe).

casacore::UDFBase::getArrayString
virtual MArray< String > getArrayString(const TableExprId &id)

casacore::UDFBase::setShape
void setShape(const IPosition &shape)
Set the shape of the results if it is fixed and known.

casacore::UDFBase::getArrayBool
virtual MArray< Bool > getArrayBool(const TableExprId &id)

casacore::UDFBase::setup
virtual void setup(const Table &table, const TaQLStyle &)=0
Set up the function object.

casacore::Vector
Definition Vector.h:82

casacore
this file contains all the compiler specific defines
Definition mainpage.dox:28

casacore::False
const Bool False
Definition aipstype.h:42

casacore::Int64
long long Int64
Define the extra non-standard types used by Casacore (like proposed uSize, Size)
Definition aipsxtype.h:36

casacore::Int
int Int
Definition aipstype.h:48

casacore::Bool
bool Bool
Define the standard types used by Casacore.
Definition aipstype.h:40

casacore::Double
double Double
Definition aipstype.h:53