Skip to content
Projects
Groups
Snippets
Help
This project
Loading...
Sign in / Register
Toggle navigation
T
tic
Overview
Overview
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
wenyuanbo
tic
Commits
4d2fc952
Commit
4d2fc952
authored
Nov 12, 2017
by
Tianqi Chen
Committed by
GitHub
Nov 12, 2017
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
[PASS] Fix vthread when extern access touching (#636)
parent
b07ceff5
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
76 additions
and
8 deletions
+76
-8
src/pass/inject_virtual_thread.cc
+42
-8
tests/python/unittest/test_pass_inject_vthread.py
+34
-0
No files found.
src/pass/inject_virtual_thread.cc
View file @
4d2fc952
...
@@ -15,11 +15,12 @@ namespace ir {
...
@@ -15,11 +15,12 @@ namespace ir {
// If expression is touched by var.
// If expression is touched by var.
class
ExprTouched
final
:
public
IRVisitor
{
class
ExprTouched
final
:
public
IRVisitor
{
public
:
public
:
explicit
ExprTouched
(
const
std
::
unordered_set
<
const
Variable
*>
&
touched
)
explicit
ExprTouched
(
const
std
::
unordered_set
<
const
Variable
*>
&
touched
,
:
touched_var_
(
touched
)
{}
bool
check_write
)
:
touched_var_
(
touched
),
check_write_
(
check_write
)
{}
void
Visit
(
const
NodeRef
&
n
)
final
{
void
Visit
(
const
NodeRef
&
n
)
final
{
// early stopping
// early stopping
if
(
expr_touched_
)
return
;
if
(
expr_touched_
&&
!
check_write_
)
return
;
IRVisitor
::
Visit
(
n
);
IRVisitor
::
Visit
(
n
);
}
}
void
Visit_
(
const
Load
*
op
)
final
{
void
Visit_
(
const
Load
*
op
)
final
{
...
@@ -29,6 +30,24 @@ class ExprTouched final : public IRVisitor {
...
@@ -29,6 +30,24 @@ class ExprTouched final : public IRVisitor {
void
Visit_
(
const
Variable
*
op
)
final
{
void
Visit_
(
const
Variable
*
op
)
final
{
HandleUseVar
(
op
);
HandleUseVar
(
op
);
}
}
void
Visit_
(
const
Call
*
op
)
final
{
if
(
op
->
is_intrinsic
(
intrinsic
::
tvm_access_ptr
))
{
int
rw_mask
;
CHECK
(
arith
::
GetConstInt
(
op
->
args
[
4
],
&
rw_mask
));
const
Variable
*
buffer_var
=
op
->
args
[
1
].
as
<
Variable
>
();
CHECK
(
buffer_var
);
// read
if
(
rw_mask
&
1
)
{
HandleUseVar
(
buffer_var
);
}
if
(
rw_mask
&
2
)
{
HandleWriteVar
(
buffer_var
);
}
this
->
Visit
(
op
->
args
[
2
]);
}
else
{
IRVisitor
::
Visit_
(
op
);
}
}
void
HandleUseVar
(
const
Variable
*
var
)
{
void
HandleUseVar
(
const
Variable
*
var
)
{
auto
it
=
touched_var_
.
find
(
var
);
auto
it
=
touched_var_
.
find
(
var
);
if
(
it
!=
touched_var_
.
end
())
{
if
(
it
!=
touched_var_
.
end
())
{
...
@@ -40,36 +59,49 @@ class ExprTouched final : public IRVisitor {
...
@@ -40,36 +59,49 @@ class ExprTouched final : public IRVisitor {
used_vars_
.
push_back
(
var
);
used_vars_
.
push_back
(
var
);
}
}
}
}
void
HandleWriteVar
(
const
Variable
*
var
)
{
write_vars_
.
push_back
(
var
);
}
// the fields.
// the fields.
bool
expr_touched_
{
false
};
bool
expr_touched_
{
false
};
std
::
vector
<
const
Variable
*>
used_vars_
;
std
::
vector
<
const
Variable
*>
used_vars_
;
std
::
vector
<
const
Variable
*>
write_vars_
;
const
std
::
unordered_set
<
const
Variable
*>&
touched_var_
;
const
std
::
unordered_set
<
const
Variable
*>&
touched_var_
;
bool
check_write_
;
};
};
// Analyze if the buffers are invariant to value of var
// Analyze if the buffers are invariant to value of var
class
VarTouchedAnalysis
:
public
IRVisitor
{
class
VarTouchedAnalysis
:
public
IRVisitor
{
public
:
public
:
void
Visit_
(
const
LetStmt
*
op
)
{
void
Visit_
(
const
LetStmt
*
op
)
{
ExprTouched
tc
(
touched_var_
);
ExprTouched
tc
(
touched_var_
,
false
);
tc
.
Visit
(
op
->
value
);
tc
.
Visit
(
op
->
value
);
Record
(
op
->
var
.
get
(),
tc
);
Record
(
op
->
var
.
get
(),
tc
);
this
->
Visit
(
op
->
body
);
this
->
Visit
(
op
->
body
);
}
}
void
Visit_
(
const
Store
*
op
)
{
void
Visit_
(
const
Store
*
op
)
{
ExprTouched
tc
(
touched_var_
);
ExprTouched
tc
(
touched_var_
,
false
);
tc
.
Visit
(
op
->
value
);
tc
.
Visit
(
op
->
value
);
tc
.
Visit
(
op
->
index
);
tc
.
Visit
(
op
->
index
);
Record
(
op
->
buffer_var
.
get
(),
tc
);
Record
(
op
->
buffer_var
.
get
(),
tc
);
}
}
void
Visit_
(
const
For
*
op
)
{
void
Visit_
(
const
For
*
op
)
{
ExprTouched
tc
(
touched_var_
);
ExprTouched
tc
(
touched_var_
,
false
);
tc
.
Visit
(
op
->
min
);
tc
.
Visit
(
op
->
min
);
tc
.
Visit
(
op
->
extent
);
tc
.
Visit
(
op
->
extent
);
Record
(
op
->
loop_var
.
get
(),
tc
);
Record
(
op
->
loop_var
.
get
(),
tc
);
this
->
Visit
(
op
->
body
);
this
->
Visit
(
op
->
body
);
}
}
// external function call
void
Visit_
(
const
Evaluate
*
op
)
{
ExprTouched
tc
(
touched_var_
,
true
);
tc
.
Visit
(
op
->
value
);
for
(
const
Variable
*
var
:
tc
.
write_vars_
)
{
Record
(
var
,
tc
);
}
}
void
Visit_
(
const
Allocate
*
op
)
{
void
Visit_
(
const
Allocate
*
op
)
{
ExprTouched
tc
(
touched_var_
);
ExprTouched
tc
(
touched_var_
,
false
);
for
(
size_t
i
=
0
;
i
<
op
->
extents
.
size
();
++
i
)
{
for
(
size_t
i
=
0
;
i
<
op
->
extents
.
size
();
++
i
)
{
tc
.
Visit
(
op
->
extents
[
i
]);
tc
.
Visit
(
op
->
extents
[
i
]);
}
}
...
@@ -87,7 +119,9 @@ class VarTouchedAnalysis : public IRVisitor {
...
@@ -87,7 +119,9 @@ class VarTouchedAnalysis : public IRVisitor {
touched_var_
.
insert
(
var
);
touched_var_
.
insert
(
var
);
}
else
{
}
else
{
for
(
const
Variable
*
r
:
tc
.
used_vars_
)
{
for
(
const
Variable
*
r
:
tc
.
used_vars_
)
{
affect_
[
r
].
push_back
(
var
);
if
(
r
!=
var
)
{
affect_
[
r
].
push_back
(
var
);
}
}
}
}
}
}
}
...
...
tests/python/unittest/test_pass_inject_vthread.py
View file @
4d2fc952
...
@@ -28,5 +28,39 @@ def test_vthread():
...
@@ -28,5 +28,39 @@ def test_vthread():
stmt
=
tvm
.
ir_pass
.
InjectVirtualThread
(
get_vthread
(
"cthread"
))
stmt
=
tvm
.
ir_pass
.
InjectVirtualThread
(
get_vthread
(
"cthread"
))
assert
len
(
stmt
.
body
.
body
.
extents
)
==
3
assert
len
(
stmt
.
body
.
body
.
extents
)
==
3
def
test_vthread_extern
():
dtype
=
'int64'
n
=
100
m
=
4
nthread
=
2
def
get_vthread
(
name
):
tx
=
tvm
.
thread_axis
(
name
)
ty
=
tvm
.
thread_axis
(
name
)
ib
=
tvm
.
ir_builder
.
create
()
with
ib
.
for_range
(
0
,
n
)
as
i
:
ib
.
scope_attr
(
tx
,
"virtual_thread"
,
nthread
)
ib
.
scope_attr
(
ty
,
"virtual_thread"
,
nthread
)
A
=
ib
.
allocate
(
"float32"
,
m
,
name
=
"A"
,
scope
=
"shared"
)
B
=
ib
.
allocate
(
"float32"
,
m
,
name
=
"B"
,
scope
=
"shared"
)
C
=
ib
.
allocate
(
"float32"
,
m
,
name
=
"C"
,
scope
=
"shared"
)
cbuffer
=
tvm
.
decl_buffer
((
m
,),
dtype
=
C
.
dtype
,
data
=
C
.
asnode
())
abuffer
=
tvm
.
decl_buffer
((
m
,),
dtype
=
A
.
dtype
,
data
=
A
.
asnode
())
bbuffer
=
tvm
.
decl_buffer
((
m
,),
dtype
=
B
.
dtype
,
data
=
B
.
asnode
())
A
[
tx
]
=
tx
+
1.0
B
[
ty
]
=
ty
+
1.0
ib
.
emit
(
tvm
.
call_extern
(
"int32"
,
"Run"
,
abuffer
.
access_ptr
(
"r"
),
bbuffer
.
access_ptr
(
"r"
),
cbuffer
.
access_ptr
(
"rw"
)))
return
ib
.
get
()
stmt
=
tvm
.
ir_pass
.
InjectVirtualThread
(
get_vthread
(
"vthread"
))
assert
stmt
.
body
.
body
.
extents
[
0
]
.
value
==
2
assert
stmt
.
body
.
body
.
body
.
body
.
body
.
body
.
extents
[
0
]
.
value
==
2
assert
len
(
stmt
.
body
.
body
.
body
.
body
.
body
.
body
.
extents
)
==
3
if
__name__
==
"__main__"
:
if
__name__
==
"__main__"
:
test_vthread_extern
()
test_vthread
()
test_vthread
()
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment