===================================================================================
VECTOR SEARCH DEMO COMMANDS
===================================================================================
===================================================
Sample Table Creation With Vector Datatype:
===================================================
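A minimal sketch of such a table, assuming the DOC_CHUNKS layout used in the PDF
workflow below (table and column names are illustrative):

```sql
-- Table holding document chunks and their embeddings. The VECTOR
-- datatype can optionally be constrained, e.g. VECTOR(384, FLOAT32);
-- left unconstrained here so any model dimension fits.
CREATE TABLE doc_chunks (
  doc_id          NUMBER,
  chunk_id        NUMBER,
  chunk_data      VARCHAR2(4000),
  chunk_embedding VECTOR
);
```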
===================================================================================
DEMO TO ILLUSTRATE THE WORKFLOW OF VECTOR SEARCH ARCHITECTURE USING PDF DOCUMENTS
===================================================================================
Using the DBMS_VECTOR package, load your embedding model into the Oracle Database.
You must specify the directory where you stored your model in ONNX format as well
as describe what type of model it is and how you want to use it.
$ sqlplus vector/<passwd>@<pdb_service_name>
Note:
At minimum, the JSON metadata must describe the machine learning 'function'
supported by the model.
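The load call itself is not shown above; a minimal sketch using
DBMS_VECTOR.LOAD_ONNX_MODEL (the DM_DUMP directory object, file name, and
doc_model name are assumptions consistent with the rest of this demo):

```sql
-- Load the ONNX embedding model from the DM_DUMP directory object.
-- The JSON metadata declares the ML "function" (mandatory) and maps
-- the model's input and output names.
BEGIN
  DBMS_VECTOR.LOAD_ONNX_MODEL(
    directory  => 'DM_DUMP',
    file_name  => 'my_embedding_model.onnx',
    model_name => 'doc_model',
    metadata   => JSON('{"function" : "embedding",
                         "embeddingOutput" : "embedding",
                         "input" : {"input" : ["DATA"]}}'));
END;
/
```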
SQL>
insert into doc_chunks
  select dt.id doc_id, et.embed_id chunk_id, et.embed_data chunk_data,
         to_vector(et.embed_vector) chunk_embedding
  from
    documentation_tab dt,
    dbms_vector_chain.utl_to_embeddings(
      dbms_vector_chain.utl_to_chunks(dbms_vector_chain.utl_to_text(dt.data),
        json('{"normalize":"all"}')),
      json('{"provider":"database", "model":"doc_model"}')) t,
    JSON_TABLE(t.column_value, '$[*]'
      COLUMNS (embed_id     NUMBER         PATH '$.embed_id',
               embed_data   VARCHAR2(4000) PATH '$.embed_data',
               embed_vector CLOB           PATH '$.embed_vector')) et;
SQL> commit;
For a similarity search, you need query vectors. Here you enter your query text
and generate its associated vector embedding.
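The generation step is not shown above; a sketch using SQL*Plus bind variables
and the VECTOR_EMBEDDING SQL function (doc_model follows the earlier load step):

```sql
-- Prompt for a question and embed it with the in-database ONNX model.
ACCEPT text_input CHAR PROMPT 'Ask a question: '
VARIABLE text_variable VARCHAR2(1000)
VARIABLE query_vector CLOB
BEGIN
  :text_variable := '&text_input';
  -- VECTOR_EMBEDDING generates the embedding for the bound text
  -- using the imported model.
  SELECT VECTOR_EMBEDDING(doc_model USING :text_variable AS data)
    INTO :query_vector;
END;
/
```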
PRINT query_vector
6. Run a similarity search to find, within your books, the first four most relevant
chunks that talk about backup and recovery.
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
Using the generated query vector, you search similar chunks in the DOC_CHUNKS
table. For this, you use the VECTOR_DISTANCE SQL function and the FETCH SQL clause
to retrieve the most similar chunks.
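A sketch of that query (FETCH EXACT is the optional default; COSINE matches the
index distance shown later):

```sql
-- Exact (full-scan) similarity search: return the 4 chunks whose
-- embeddings are closest to the query vector by cosine distance.
SELECT doc_id, chunk_id, chunk_data
FROM doc_chunks
ORDER BY VECTOR_DISTANCE(chunk_embedding, TO_VECTOR(:query_vector), COSINE)
FETCH EXACT FIRST 4 ROWS ONLY;
```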
7. Run a multi-vector similarity search to find, within your books, the first four
most relevant chunks in the first two most relevant books.
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
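A sketch using the multi-vector FETCH PARTITIONS BY syntax, partitioning on
doc_id so that at most two books contribute rows:

```sql
-- Multi-vector similarity search: the 4 best chunks drawn from the
-- 2 most relevant documents.
SELECT doc_id, chunk_id, chunk_data
FROM doc_chunks
ORDER BY VECTOR_DISTANCE(chunk_embedding, TO_VECTOR(:query_vector), COSINE)
FETCH FIRST 2 PARTITIONS BY doc_id, 4 ROWS ONLY;
```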
8. Create an In-Memory Neighbor Graph Vector Index on the vector embeddings that
you created
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
When dealing with huge vector embedding spaces, you may want to create vector
indexes to accelerate your similarity searches. Instead of scanning every vector
embedding in your table, a vector index uses heuristics to reduce the search
space and speed up the search. This is called approximate similarity search.
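The index creation itself is not shown here; a sketch of an HNSW in-memory
neighbor graph index matching the parameter dump below, followed by the
dictionary query that produces that dump (the index name is an assumption):

```sql
-- Create an HNSW in-memory neighbor graph vector index on the chunk
-- embeddings with a 95% target accuracy.
CREATE VECTOR INDEX docs_hnsw_idx
  ON doc_chunks (chunk_embedding)
  ORGANIZATION INMEMORY NEIGHBOR GRAPH
  DISTANCE COSINE
  WITH TARGET ACCURACY 95
  PARAMETERS (type HNSW, neighbors 32, efconstruction 300);

-- Inspect the index parameters recorded in the data dictionary.
SELECT JSON_SERIALIZE(IDX_PARAMS RETURNING VARCHAR2 PRETTY)
FROM VECSYS.VECTOR$INDEX
WHERE IDX_NAME = 'DOCS_HNSW_IDX';
```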
JSON_SERIALIZE(IDX_PARAMS RETURNING VARCHAR2 PRETTY)
________________________________________________________________
{
"type" : "HNSW",
"num_neighbors" : 32,
"efConstruction" : 300,
"distance" : "COSINE",
"accuracy" : 95,
"vector_type" : "FLOAT32",
"vector_dimension" : 384,
"degree_of_parallelism" : 1,
"pdb_id" : 3,
"indexed_col" : "CHUNK_EMBEDDING"
}
To get an idea about the size of your In-Memory Neighbor Graph Vector Index in
memory, you can use the V$VECTOR_MEMORY_POOL view.
See Size the Vector Pool for more information about sizing the vector pool to allow
for vector index creation and maintenance.
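For example, to see allocation and usage in MB:

```sql
-- Show vector pool allocation and usage per container, in MB.
SELECT CON_ID, POOL,
       ALLOC_BYTES/1024/1024 AS ALLOC_BYTES_MB,
       USED_BYTES/1024/1024  AS USED_BYTES_MB
FROM V$VECTOR_MEMORY_POOL
ORDER BY CON_ID, POOL;
```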
Use the VECTOR_DISTANCE function and the FETCH APPROX SQL clause to retrieve the
most similar chunks using your vector index.
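A sketch of the approximate search; the per-query TARGET ACCURACY overrides the
default set at index creation:

```sql
-- Approximate similarity search driven by the HNSW vector index.
SELECT doc_id, chunk_id, chunk_data
FROM doc_chunks
ORDER BY VECTOR_DISTANCE(chunk_embedding, TO_VECTOR(:query_vector), COSINE)
FETCH APPROX FIRST 4 ROWS ONLY WITH TARGET ACCURACY 80;
```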
11. Determine your vector index performance for your approximate similarity
searches
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
After a vector index is created, you may want to know how accurate your
approximate vector searches are.
The index accuracy reporting feature allows you to determine the accuracy of your
vector indexes.
SQL>
SET SERVEROUTPUT ON
declare
  report varchar2(128);
begin
  report := dbms_vector.index_accuracy_query(
    owner_name      => 'VECTOR',
    index_name      => 'DOCS_HNSW_IDX',
    qv              => :query_vector,
    top_K           => 10,
    target_accuracy => 90);
  dbms_output.put_line(report);
end;
/
===================================================================================
A comprehensive example of importing a pretrained ONNX embedding model and
generating vector embeddings
===================================================================================
Instead of the DBMS_VECTOR package, you can also use the DBMS_DATA_MINING package
to import a pretrained ONNX embedding model.
Use the DBMS_DATA_MINING.IMPORT_ONNX_MODEL procedure to import the model and
declare the input name.
The following code gives an example:
CONN dmuser/<password>@<pdbname>;
DECLARE
  m_blob    BLOB default empty_blob();
  m_src_loc BFILE;
BEGIN
  DBMS_LOB.createtemporary(m_blob, FALSE);
  m_src_loc := BFILENAME('DM_DUMP', 'my_embedding_model.onnx');
  DBMS_LOB.fileopen(m_src_loc, DBMS_LOB.file_readonly);
  DBMS_LOB.loadfromfile(m_blob, m_src_loc, DBMS_LOB.getlength(m_src_loc));
  DBMS_LOB.close(m_src_loc);
  DBMS_DATA_MINING.import_onnx_model('doc_model', m_blob,
    JSON('{"function" : "embedding",
           "embeddingOutput" : "embedding",
           "input" : {"input" : ["DATA"]}}'));
  DBMS_LOB.freetemporary(m_blob);
END;
/
DECLARE
  model_source BLOB := NULL;
BEGIN
  -- get BLOB holding the ONNX model from object storage
  model_source := DBMS_CLOUD.GET_OBJECT(
    credential_name => 'myCredential',
    object_uri      => 'https://objectstorage.us-phoenix-1.oraclecloud.com/' ||
                       'n/namespace-string/b/bucketname/o/myONNXmodel.onnx');
  DBMS_DATA_MINING.IMPORT_ONNX_MODEL(
    'myonnxmodel',
    model_source,
    JSON('{"function" : "embedding"}'));
END;
/
===================================================================================
EASY TO UNDERSTAND EXAMPLE WITHOUT THE PDF DOCUMENT SCENARIO: DIRECT TEXT CONTENT
===================================================================================
conn docuser/password@CDB_PDB;
SET ECHO ON
SET FEEDBACK 1
SET NUMWIDTH 10
SET LINESIZE 80
SET TRIMSPOOL ON
SET TAB OFF
SET PAGESIZE 10000
SET LONG 10000
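The table setup and chunking step for this scenario is not shown above; a minimal
sketch consistent with the columns queried below, using
DBMS_VECTOR_CHAIN.UTL_TO_CHUNKS on direct text (the table layout, doc_model name,
chunking parameters, and source text are all assumptions):

```sql
-- Chunk a piece of text directly (no PDF) and store each chunk with
-- its embedding. Column names match the SELECT statements below.
CREATE TABLE doc_chunks (
  id           NUMBER,
  chunk_id     NUMBER,
  chunk_offset NUMBER,
  chunk_length NUMBER,
  chunk        VARCHAR2(4000),
  vector       VECTOR
);

INSERT INTO doc_chunks
  SELECT 1 AS id, jt.chunk_id, jt.chunk_offset, jt.chunk_length, jt.chunk,
         VECTOR_EMBEDDING(doc_model USING jt.chunk AS data) AS vector
  FROM (SELECT 'Your long text goes here ...' AS txt FROM dual) src,
       dbms_vector_chain.utl_to_chunks(src.txt,
         json('{"by":"words","max":"100","overlap":"10","split":"sentence"}')) t,
       JSON_TABLE(t.column_value, '$[*]'
         COLUMNS (chunk_id     NUMBER         PATH '$.chunk_id',
                  chunk_offset NUMBER         PATH '$.chunk_offset',
                  chunk_length NUMBER         PATH '$.chunk_length',
                  chunk        VARCHAR2(4000) PATH '$.chunk_data')) jt;
```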
commit;
desc doc_chunks;
set linesize 100
set long 1000
col id for 999
col chunk_id for 99999
col chunk_offset for 99999
col chunk_length for 99999
col chunk for a30
col vector for a100
select id, chunk_id, chunk_offset, chunk_length, chunk from doc_chunks;
select vector from doc_chunks where rownum <= 1;
===================================================================================
SQL RAG EXAMPLE
===================================================================================
This scenario runs a similarity search for documentation content relevant to a
user query. Once documentation chunks are retrieved, they are concatenated and a
prompt is generated asking an LLM to answer the user's question using the
retrieved chunks.
+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
conn sys/password AS sysdba

BEGIN
  DBMS_NETWORK_ACL_ADMIN.APPEND_HOST_ACE(
    host => '*',
    ace  => xs$ace_type(privilege_list => xs$name_list('connect'),
                        principal_name => 'VECTOR',
                        principal_type => xs_acl.ptype_db));
END;
/
conn docuser/password;
BEGIN
DBMS_VECTOR_CHAIN.DROP_CREDENTIAL(credential_name => 'OCI_CRED');
EXCEPTION
WHEN OTHERS THEN NULL;
END;
/
DECLARE
jo json_object_t;
BEGIN
jo := json_object_t();
jo.put('user_ocid', '<user ocid>');
jo.put('tenancy_ocid', '<tenancy ocid>');
jo.put('compartment_ocid', '<compartment ocid>');
jo.put('private_key', '<private key>');
jo.put('fingerprint', '<fingerprint>');
DBMS_OUTPUT.PUT_LINE(jo.to_string);
DBMS_VECTOR_CHAIN.CREATE_CREDENTIAL(
credential_name => 'OCI_CRED',
params => json(jo.to_string));
END;
/
DECLARE
input CLOB;
params CLOB;
output CLOB;
BEGIN
input := :prompt;
params := '{
  "provider"        : "ocigenai",
  "credential_name" : "OCI_CRED",
  "url"             : "https://inference.generativeai.us-chicago-1.oci.oraclecloud.com/20231130/actions/generateText",
  "model"           : "cohere.command"
}';
output := DBMS_VECTOR_CHAIN.UTL_TO_GENERATE_TEXT(input, json(params));
DBMS_OUTPUT.PUT_LINE(output);
IF output IS NOT NULL THEN
DBMS_LOB.FREETEMPORARY(output);
END IF;
EXCEPTION
WHEN OTHERS THEN
DBMS_OUTPUT.PUT_LINE(SQLERRM);
DBMS_OUTPUT.PUT_LINE(SQLCODE);
END;
/
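The :prompt bind variable above is assumed to hold the user question plus the
retrieved chunks; a minimal sketch of building it (the question text and the
concatenation format are assumptions):

```sql
VARIABLE prompt CLOB

-- Build a RAG prompt: the user question followed by the top-4 chunks
-- retrieved by approximate similarity search.
DECLARE
  user_question  VARCHAR2(4000) := 'How do I back up my database?';
  context_chunks CLOB := EMPTY_CLOB();
BEGIN
  FOR rec IN (
    SELECT chunk_data
    FROM doc_chunks
    ORDER BY VECTOR_DISTANCE(chunk_embedding, TO_VECTOR(:query_vector), COSINE)
    FETCH APPROX FIRST 4 ROWS ONLY)
  LOOP
    context_chunks := context_chunks || rec.chunk_data || chr(10);
  END LOOP;
  :prompt := 'Answer the question using only the provided context.' || chr(10) ||
             'Question: ' || user_question || chr(10) ||
             'Context: '  || chr(10) || context_chunks;
END;
/
```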
+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++